<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="brief-report" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1269837</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2023.1269837</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Brief Research Report</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Genome of <italic>Linum usitatissimum</italic> convar. <italic>crepitans</italic> expands the view on the section <italic>Linum</italic>
</article-title>
<alt-title alt-title-type="left-running-head">Dvorianinova et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2023.1269837">10.3389/fgene.2023.1269837</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Dvorianinova</surname>
<given-names>Ekaterina M.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1055556/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Pushkova</surname>
<given-names>Elena N.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1056082/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bolsheva</surname>
<given-names>Nadezhda L.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/310628/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Borkhert</surname>
<given-names>Elena V.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/488866/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rozhmina</surname>
<given-names>Tatiana A.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhernova</surname>
<given-names>Daiana A.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2412827/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Novakovskiy</surname>
<given-names>Roman O.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1055924/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Turba</surname>
<given-names>Anastasia A.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2388002/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sigova</surname>
<given-names>Elizaveta A.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2412969/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Melnikova</surname>
<given-names>Nataliya V.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/266277/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Dmitriev</surname>
<given-names>Alexey A.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/336564/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Engelhardt Institute of Molecular Biology</institution>, <institution>Russian Academy of Sciences</institution>, <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Federal Research Center for Bast Fiber Crops</institution>, <addr-line>Torzhok</addr-line>, <country>Russia</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Faculty of Biology</institution>, <institution>Lomonosov Moscow State University</institution>, <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Moscow Institute of Physics and Technology</institution>, <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/840777/overview">Fakhriddin Kushanov</ext-link>, Academy of Sciences Republic of Uzbekistan (UzAS), Uzbekistan</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1466996/overview">Ritwika Das</ext-link>, Indian Agricultural Statistics Research Institute, Indian Council of Agricultural Research, India</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2203604/overview">Eman Tawfik</ext-link>, Helwan University, Egypt</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/653566/overview">Xuming Li</ext-link>, Hugo Biotechnologies Co., Ltd., China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1125117/overview">Wang Xiao</ext-link>, Chinese Academy of Sciences (CAS), China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Ekaterina M. Dvorianinova, <email>dvorianinova.em@phystech.edu</email>; Alexey A. Dmitriev, <email>alex_245@mail.ru</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>22</day>
<month>11</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1269837</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>07</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>24</day>
<month>10</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Dvorianinova, Pushkova, Bolsheva, Borkhert, Rozhmina, Zhernova, Novakovskiy, Turba, Sigova, Melnikova and Dmitriev.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Dvorianinova, Pushkova, Bolsheva, Borkhert, Rozhmina, Zhernova, Novakovskiy, Turba, Sigova, Melnikova and Dmitriev</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Sequencing whole plant genomes provides a solid foundation for applied and basic studies. Genome sequences of agricultural plants attract special attention, as they reveal information on the regulation of beneficial plant traits. Flax is a valuable crop cultivated for oil and fiber. Genome sequences of its representatives are rich sources of genetic information for the improvement of cultivated forms of the plant. In our work, we sequenced the first genome of flax with the dehiscence of capsules&#x2014;<italic>Linum usitatissimum</italic> convar. <italic>&#x441;repitans</italic> (Boenn.) Dumort&#x2014;on the Oxford Nanopore Technologies (ONT) and Illumina platforms. We obtained 23&#xa0;Gb of raw ONT data and 89&#xa0;M of 150 &#x2b; 150 paired-end Illumina reads and tested different tools for genome assembly and polishing. The genome assembly produced according to the Canu&#x2014;Racon &#xd7;2&#x2014;medaka&#x2014;POLCA scheme had optimal contiguity and completeness: assembly length&#x2014;412.6&#xa0;Mb, N50&#x2014;5.2&#xa0;Mb, L50&#x2014;28, and complete BUSCO&#x2014;94.6% (64.0% duplicated, eudicots_odb10). The obtained high-quality genome assembly of <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic> provides opportunities for further studies of evolution, domestication, and genome regulation in the section <italic>Linum</italic>.</p>
</abstract>
<kwd-group>
<kwd>flax</kwd>
<kwd>
<italic>Linum usitatissimum</italic> convar. <italic>crepitans</italic>
</kwd>
<kwd>section <italic>Linum</italic>
</kwd>
<kwd>nanopore sequencing</kwd>
<kwd>
<italic>de novo</italic> genome assembly</kwd>
</kwd-group>
<contract-num rid="cn001">075-15-2021-1064</contract-num>
<contract-sponsor id="cn001">Ministry of Science and Higher Education of the Russian Federation<named-content content-type="fundref-id">10.13039/501100012190</named-content>
</contract-sponsor>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Genomics of Plants and the Phytoecosystem</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Plant genomes demonstrate high variability in size and content (<xref ref-type="bibr" rid="B20">Li et al., 2022</xref>; <xref ref-type="bibr" rid="B36">Sun et al., 2022</xref>). Genome sequences enable studying the beneficial features of agricultural plants and modifying and improving the desired traits (<xref ref-type="bibr" rid="B25">N&#xfc;tzmann et al., 2016</xref>; <xref ref-type="bibr" rid="B30">Sedeek et al., 2019</xref>; <xref ref-type="bibr" rid="B40">Wang et al., 2020</xref>; <xref ref-type="bibr" rid="B6">Choudhury et al., 2022</xref>; <xref ref-type="bibr" rid="B33">Singh et al., 2022</xref>; <xref ref-type="bibr" rid="B37">Tello-Ruiz et al., 2022</xref>). Therefore, plant genomics and pan-genomics open vast opportunities for breeding and agriculture. Knowledge of genome structure can unveil the mechanisms of regulation of key agricultural traits and highlight possible large-scale differences between the representatives of a taxon. In addition, plant genomes can spur studies on the evolution, domestication, and adaptation processes and the emergence of metabolic diversity driven by whole genome duplication (<xref ref-type="bibr" rid="B35">Song et al., 2021</xref>; <xref ref-type="bibr" rid="B12">El Karkouri et al., 2022</xref>; <xref ref-type="bibr" rid="B27">Petereit et al., 2022</xref>; <xref ref-type="bibr" rid="B46">Zhou and Liu, 2022</xref>; <xref ref-type="bibr" rid="B1">Bartlett et al., 2023</xref>).</p>
<p>
<italic>Linum usitatissimum</italic> L. is a dual-purpose agricultural plant providing two main raw products of multipurpose use&#x2014;seed and fiber (<xref ref-type="bibr" rid="B24">Nag et al., 2015</xref>). Flax seed is a source of biologically active compounds beneficial for human health (<xref ref-type="bibr" rid="B14">Kezimana et al., 2018</xref>; <xref ref-type="bibr" rid="B34">Sirotkin, 2023</xref>). Flax seed in animal feed also causes positive effects on immunity and growth (<xref ref-type="bibr" rid="B29">Salem et al., 2023</xref>). Flax oil of a certain fatty acid composition is actively used in the coating industry (<xref ref-type="bibr" rid="B41">Wang and Padua, 2005</xref>; <xref ref-type="bibr" rid="B9">Dmitriev et al., 2020a</xref>). In addition to the use in textile production (<xref ref-type="bibr" rid="B38">Van der Werf and Turunen, 2008</xref>), flax fiber serves as a component of composite materials (<xref ref-type="bibr" rid="B22">More, 2022</xref>). Flax biomass can be used as a source of bioenergy (<xref ref-type="bibr" rid="B2">Batog et al., 2023</xref>). Thus, <italic>L. usitatissimum</italic> is an important agricultural crop, and data on its diversity at the genome level can be implicated in breeding and understanding the evolution in the section <italic>Linum</italic>.</p>
<p>Genome sequences of flax representatives are useful sources of information for both basic and applied studies. Currently, seven <italic>L. usitatissimum</italic> assemblies are available in the databases (NCBI and Zenodo) (<xref ref-type="bibr" rid="B43">You et al., 2018</xref>; <xref ref-type="bibr" rid="B10">Dmitriev et al., 2020b</xref>; <xref ref-type="bibr" rid="B44">Zhang et al., 2020</xref>; <xref ref-type="bibr" rid="B28">Sa et al., 2021</xref>; <xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>; <xref ref-type="bibr" rid="B45">Zhao et al., 2023</xref>). In the species of the section <italic>Linum</italic>, apart from <italic>L. usitatissimum</italic>, a genome of <italic>Linum bienne</italic> Mill. (considered to be a wild ancestor of cultivated flax) is available in the NCBI database (<xref ref-type="bibr" rid="B44">Zhang et al., 2020</xref>). Our study aimed at assembling a high-quality genome of <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic> (Boenn.) Dumort. Convar. <italic>crepitans</italic> is a group of flax varieties with spontaneously opening capsules. It has been cultivated for fiber in Europe, but now it is not in use since seed shattering significantly complicates harvesting. However, it can be found in germplasm collections. The main feature of the convar. <italic>crepitans</italic> is the dehiscence of its capsules, but in other ways, it is quite similar to <italic>L. usitatissimum</italic> convar. <italic>usitatissimum</italic> (<xref ref-type="bibr" rid="B23">Muir and Westcott, 2003</xref>). The genetic resource of the convar. <italic>crepitans</italic> is limited (<xref ref-type="bibr" rid="B7">Diederichsen, 2019</xref>). Nevertheless, the investigation of this convar. can significantly broaden the data on genetic diversity and domestication of <italic>L. usitatissimum</italic>. The genome assembly of the convar. <italic>crepitans</italic> can be incorporated in pan-genomic studies of flax, including the construction of pan-genome, mining key agricultural traits, and establishing the evolution of flax forms.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Material and methods</title>
<sec id="s2-1">
<title>2.1 Plant material</title>
<p>The seeds of <italic>L</italic>. <italic>usitatissimum</italic> convar. <italic>crepitans</italic> K-1531 were provided by the Institute for Flax (Torzhok, Russia). The seeds were sterilized in a 1% NaClO solution for 5&#xa0;min and then germinated on Petri dishes. High-quality seedlings were transplanted into the soil and grown for 3&#x2013;4&#xa0;weeks. After that, the tops of the plant branches were covered with a dark cloth to prevent exposure to light for 1&#xa0;week. This step was important to minimize the level of metabolites in flax leaves before DNA extraction. The leaves were collected, frozen in liquid nitrogen, and stored at &#x2212;70&#xb0;C until DNA isolation.</p>
</sec>
<sec id="s2-2">
<title>2.2 DNA extraction</title>
<p>Nucleus isolation and DNA extraction were performed according to the previously developed protocol (<xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>). Additionally, part of the DNA was purified using the Circulomics Short Read Eliminator kit (SRE kit, Circulomics, United States). DNA concentration and quality were assessed using a Qubit fluorometer (Thermo Fisher Scientific, United States) and a NanoDrop spectrophotometer (Thermo Fisher Scientific), as well as by electrophoresis in 0.3% agarose gel.</p>
</sec>
<sec id="s2-3">
<title>2.3 Nanopore and Illumina sequencing</title>
<p>Three libraries were prepared for Nanopore sequencing according to the manufacturer&#x2019;s protocol for SQK-LSK109 and SQK-LSK114 kits (Oxford Nanopore Technologies (ONT), United Kingdom). The first one was prepared from the SRE-purified DNA using the SQK-LSK109 kit (ONT) and sequenced on the FLO-MIN-106D R9.4.1 flow cell (ONT). The second one was prepared from the SRE-purified DNA using the SQK-LSK114 kit (ONT) and sequenced on the FLO-MIN-114 R10.4.1 flow cell (400&#xa0;bps mode, ONT). The third one was prepared from the non-treated DNA using the SQK-LSK109 kit (ONT) and sequenced on the FLO-MIN-106D R9.4.1 flow cell (ONT).</p>
<p>An Illumina DNA library was prepared using the NEBNext Ultra II DNA Library Prep Kit for Illumina (New England BioLabs, United Kingdom) according to the manufacturer&#x2019;s protocol. Sequencing was performed on a NovaSeq 6000 (Illumina, United States) instrument with a read length of 150 &#x2b; 150&#xa0;bp.</p>
</sec>
<sec id="s2-4">
<title>2.4 Data analysis</title>
<p>Raw FAST5 sequences were converted into FASTQ format by Guppy 6.4.6 using the super accuracy flip-flop algorithm (dna_r9.4.1_450bps_sup.cfg, dna_r10.4.1_e8.2_400bps_sup.cfg) and quality filtering (--min_qscore 8). The adapter sequences were removed with Porechop (<ext-link ext-link-type="uri" xlink:href="https://github.com/rrwick/Porechop">https://github.com/rrwick/Porechop</ext-link>).</p>
<p>Draft genomes were assembled using Canu 2.2 (<xref ref-type="bibr" rid="B16">Koren et al., 2017</xref>) (set parameter: genome size &#x3d; 400&#xa0;m), Flye 2.9 (<xref ref-type="bibr" rid="B15">Kolmogorov et al., 2019</xref>) (set parameters: &#x201c;--genome size 400&#xa0;m,&#x201d; &#x201c;--nano-raw&#x201d;), GoldRush (<xref ref-type="bibr" rid="B42">Wong et al., 2023</xref>) (set parameter: G &#x3d; 4e6), and NECAT (<xref ref-type="bibr" rid="B5">Chen et al., 2021</xref>). Assembly quality was evaluated by the QUAST parameters (QUAST 5.0.2) (<xref ref-type="bibr" rid="B13">Gurevich et al., 2013</xref>) and the presence of universal single-copy orthologs (BUSCO 4.1.2, eudicots_odb10) (<xref ref-type="bibr" rid="B32">Sim&#xe3;o et al., 2015</xref>). For the reference-based QUAST assessment, we used the first version of the genome and annotation of the <italic>L. usitatissimum</italic> variety CDC Bethune (<ext-link ext-link-type="uri" xlink:href="https://ftp.ncbi.nlm.nih.gov/genomes/genbank/plant/Linum_usitatissimum/all_assembly_versions/GCA_000224295.1_LinUsi_v1.1/">https://ftp.ncbi.nlm.nih.gov/genomes/genbank/plant/Linum_usitatissimum/all_assembly_versions/GCA_000224295.1_LinUsi_v1.1/</ext-link>, GCA_000224295.1_LinUsi_v1.1_genomic.fna.gz, GCA_000224295.1_LinUsi_v1.1_genomic.gff.gz, and GCA_000224295.1).</p>
<p>To improve the quality of the draft assembly of the convar. <italic>crepitans</italic> genome, polishing was performed using ONT reads: Racon 1.5.0 (<xref ref-type="bibr" rid="B39">Vaser et al., 2017</xref>) (polishing with both R9.4.1 and R10.4.1 reads) and medaka 1.8.0 (<ext-link ext-link-type="uri" xlink:href="https://github.com/nanoporetech/medaka">https://github.com/nanoporetech/medaka</ext-link>) (-m r1041_e82_400bps_fast_g615; polishing with R10.4.1 reads). Illumina reads were trimmed (trailing:30) and filtered (minlen:50) using Trimmomatic 0.38 (<xref ref-type="bibr" rid="B3">Bolger et al., 2014</xref>) and then used for final polishing by POLCA from MaSuRCA 4.0.1 (<xref ref-type="bibr" rid="B47">Zimin et al., 2013</xref>).</p>
<p>To align Illumina reads to the final genome assembly of the convar. <italic>crepitans</italic>, BWA-MEM (<xref ref-type="bibr" rid="B18">Li, 2013</xref>) was used. To calculate the coverage percentage of the final genome assembly with Illumina reads, SAMtools depth (<xref ref-type="bibr" rid="B19">Li et al., 2009</xref>) (set parameters: -q0 -Q0) was run on the generated bam file, and the number of covered positions was calculated with the &#x201c;wc -l&#x201d; bash command.</p>
<p>Repeat content of <italic>L. usitatissimum</italic> genome assemblies was calculated with LTR_retriever 2.9.0 (<xref ref-type="bibr" rid="B26">Ou and Jiang, 2018</xref>), which includes the BuildDatabase (default parameters), RepeatModeler (&#x201c;-engine ncbi&#x201d;), and RepeatMasker (&#x201c;consensi.fa.classified&#x201d; file as input) modules.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<p>To assemble a high-quality genome of <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic>, we performed whole-genome sequencing on the ONT and Illumina platforms. Three DNA libraries were prepared for ONT sequencing. In two DNA pools, short fragments were eliminated using the SRE kit (Circulomics, United States). For these DNA pools enriched with long fragments, we received 7.2&#xa0;Gb (R9.4.1 flow cell) and 6.2&#xa0;Gb (R10.4.1 flow cell) of raw ONT data with an N50 of 22.9 and 21.8&#xa0;kb, respectively. For the library from the non-treated DNA, we received 9.6&#xa0;Gb (R9.4.1 flow cell) of raw ONT data with an N50 of 17.3&#xa0;kb. After basecalling and adapter trimming, a total of 15.2&#xa0;Gb of ONT data with an N50 of 21.8&#xa0;kb remained. Then, we assembled draft genomes using Canu and Flye, which performed best in our previous study (<xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>), as well as GoldRush and NECAT, which were not tested by us earlier.</p>
<p>The expected size of the <italic>L. usitatissimum</italic> genome was 400&#x2013;450&#xa0;Mb (<xref ref-type="bibr" rid="B43">You et al., 2018</xref>; <xref ref-type="bibr" rid="B28">Sa et al., 2021</xref>; <xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>). Given the same size for the convar. <italic>crepitans</italic>, only Canu produced an assembly of a reasonable length&#x2014;416.3&#xa0;Mb (<xref ref-type="fig" rid="F1">Figure 1</xref>). The assembly had an N50 of 5.2&#xa0;Mb and the BUSCO completeness of 94.2% (eudicots_odb10). The assembly by NECAT had the same percentage of complete BUSCO and the highest N50 (7.2&#xa0;Mb). However, the assembly length (374.5&#xa0;Mb) was smaller than the expected one and might indicate the absence of important non-coding elements, e.g., repeats. Flye produced an assembly of an even smaller length&#x2014;323.9&#xa0;Mb. GoldRush demonstrated the worst performance among the tested software. The assembly was only 298.9&#xa0;Mb long, had an N50 in the kb-range, and the BUSCO completeness of 66.6%.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>QUAST and BUSCO statistics for the <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic> genome assemblies obtained with different tools. The green (best)&#x2013;yellow&#x2013;red (worst) color scale represents the quality of the values. BUSCO (eudicots_odb10): C&#x2014;complete, D&#x2014;duplicated, and F&#x2014;fragmented. Genomic features: complete &#x2b; partial; the detected feature from a reference genome is considered partial if it is covered by at least 100&#xa0;bp.</p>
</caption>
<graphic xlink:href="fgene-14-1269837-g001.tif"/>
</fig>
<p>The received draft assemblies were also assessed by the reference-based QUAST statistics (<xref ref-type="fig" rid="F1">Figure 1</xref>). As a reference, we used the first version of the <italic>L. usitatissimum</italic> CDC Bethune genome (GCA_000224295.1) because it was assembled from accurate Illumina reads and annotated. Using a reference genome based on Illumina data is beneficial, as it contains errors different from those in a genome assembled from ONT data. In addition, the availability of annotation of the reference genome enabled us to calculate important QUAST statistics, e.g., the number of reference genomic features. The assembly by Canu had the highest fraction of the reference genome covered and the highest number of complete reference genomic features. The assembly by Flye had the lowest relative number of mismatches/indels. However, the accuracy of the obtained genome sequences can be improved by the polishing procedure. Therefore, we chose the assembly by Canu as optimal due to its length and the received parameters of contiguity and completeness.</p>
<p>Next, we improved the accuracy of the Canu-assembled sequences by polishing. To select polishers, we relied on the results of our previous studies. Two rounds of genome polishing with Racon and one round of polishing with medaka was the best combination for ONT reads (<xref ref-type="bibr" rid="B10">Dmitriev et al., 2020b</xref>; <xref ref-type="bibr" rid="B17">Krasnov et al., 2020</xref>; <xref ref-type="bibr" rid="B21">Melnikova et al., 2021</xref>; <xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>). Therefore, we used this scheme for the genome of the convar. <italic>crepitans</italic> (<xref ref-type="fig" rid="F2">Figure 2</xref>). Two iterations of Racon significantly decreased the relative number of mismatches and especially indels (by &#x223c;2 times). The percentage of complete BUSCO and the number of complete reference genomic features increased. Polishing using medaka further improved the reference-based QUAST statistics. However, it slightly reduced the percentage of complete BUSCO (by 0.1%) and strongly reduced the percentage of duplicated BUSCO (by 1.9%). After all iterations of polishing with ONT reads (Racon &#xd7;2&#x2014;medaka), the assembly length decreased by &#x223c;4&#xa0;Mb, compared to that of the draft assembly.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>QUAST and BUSCO statistics for the Canu-assembled <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic> genome polished with different tools. The green (best)&#x2013;yellow&#x2013;red (worst) color scale represents the quality of the values. BUSCO (eudicots_odb10): C&#x2014;complete, D&#x2014;duplicated, and F&#x2014;fragmented. Genomic features: complete &#x2b; partial; the detected feature from a reference genome is considered partial if it is covered by at least 100&#xa0;bp.</p>
</caption>
<graphic xlink:href="fgene-14-1269837-g002.tif"/>
</fig>
<p>To improve the assembly accuracy to the maximum extent, we additionally polished the convar. <italic>crepitans</italic> genome (Canu&#x2014;Racon &#xd7;2&#x2014;medaka) with the generated Illumina data (89&#xa0;M of 150 &#x2b; 150 paired-end reads). According to our previous studies, POLCA was the most effective tool for Illumina reads (<xref ref-type="bibr" rid="B10">Dmitriev et al., 2020b</xref>; <xref ref-type="bibr" rid="B17">Krasnov et al., 2020</xref>; <xref ref-type="bibr" rid="B21">Melnikova et al., 2021</xref>). As a result of this procedure, the BUSCO completeness increased to 94.6% (by 0.2%), and the percentage of duplicated BUSCO increased to 64.0% (by 2.0%) (<xref ref-type="fig" rid="F2">Figure 2</xref>). Thus, it eliminated the negative effect of medaka polishing, which caused the reduction in the parameter. Polishing with Illumina data also significantly increased assembly accuracy, according to the reference-based QUAST statistics.</p>
<p>In addition to polishing the draft Canu-assembled genome with both ONT and Illumina data, we tested whether it was possible to reach the same or better results using only Illumina reads or omitting the step of polishing by medaka. Thus, we polished the Canu and Canu&#x2014;Racon &#xd7;2 assemblies with POLCA. The assembly polished using Racon (two iterations), medaka, and POLCA was more complete and accurate than the assemblies polished by Racon and POLCA or only POLCA (<xref ref-type="fig" rid="F2">Figure 2</xref>). It had more complete reference genomic features and a lower relative number of mismatches and indels. However, the Canu&#x2013;Racon &#xd7;2&#x2014;medaka&#x2014;POLCA assembly had a slightly lower percentage of duplicated BUSCO than the other two polished assemblies (Canu&#x2014;Racon &#xd7;2&#x2014;POLCA and Canu&#x2014;POLCA), by 0.3% and 0.1%, respectively. Compared to genome assemblies polished using both ONT and Illumina reads, the assembly polished only using Illumina reads (Canu&#x2014;POLCA) had significantly worse statistics of accuracy. Therefore, polishing with ONT reads could not be replaced with polishing only with short accurate reads.</p>
<p>Thus, the Canu&#x2014;Racon &#xd7;2&#x2014;medaka&#x2014;POLCA scheme produced the most contiguous and complete assembly: length&#x2014;412.6&#xa0;Mb, N50&#x2014;5.2&#xa0;Mb, L50&#x2014;28, and complete BUSCO&#x2014;94.6%. Mapping Illumina reads to the convar. <italic>crepitans</italic> genome revealed that more than 398.5 million nucleotide positions were covered (96.6% of the sequence). According to SAMtools flagstat, 98.6% of the passed Illumina reads were mapped to the assembled genome. This indicated that the obtained genome assembly is of reasonable length and high completeness.</p>
<p>To compare the assembly of <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic> with the available <italic>L. usitatissimum</italic> and <italic>L. bienne</italic> assemblies, the genomes were downloaded from the NCBI and Zenodo databases: 3896 (GCA_030674075.1), Atlant (GCA_014858635.1), Neiya No. 9 (<ext-link ext-link-type="uri" xlink:href="https://zenodo.org/record/7811972">https://zenodo.org/record/7811972</ext-link>), YY5 v.2 (<ext-link ext-link-type="uri" xlink:href="https://zenodo.org/record/4872894">https://zenodo.org/record/4872894</ext-link>), CDC Bethune v.1 and v.2 (GCA_000224295.1, GCA_000224295.2), Heiya 14 (GCA_010665265.1), Longya 10 (GCA_010665275.2), and <italic>L. bienne</italic> 15003 (GCA_010665285.1). For the downloaded assemblies, QUAST statistics were taken from the NCBI and Zenodo assembly descriptions (for the contig level) or calculated. To calculate BUSCO statistics, the eudicots_odb10 dataset was used. Among the analyzed genomes, the assembly of the convar. <italic>crepitans</italic> had one of the highest N50 and was the second most complete genome (after the assembly of Neiya No. 9), according to BUSCO statistics (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>QUAST and BUSCO (C&#x2014;complete, D&#x2014;duplicated, and F&#x2014;fragmented; eudicots_odb10) statistics and repeat content for the obtained <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic> assembly (marked bold) and <italic>L. usitatissimum</italic> and <italic>L. bienne</italic> genome assemblies available in databases.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">Flax variety</th>
<th rowspan="2" align="center">Sequencing platform</th>
<th rowspan="2" align="center">Assembly length, Mb</th>
<th rowspan="2" align="center">N50 (contig), Mb</th>
<th rowspan="2" align="center">Number of contigs</th>
<th colspan="3" align="center">BUSCO</th>
<th rowspan="2" align="center">Total interspersed repeats, %</th>
</tr>
<tr>
<th align="center">C, %</th>
<th align="center">D, %</th>
<th align="center">F, %</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">3896</td>
<td align="center">ONT</td>
<td align="center">447.1</td>
<td align="center">6.2</td>
<td align="center">1,695</td>
<td align="center">93.8</td>
<td align="center">62.3</td>
<td align="center">0.7</td>
<td align="center">49.3</td>
</tr>
<tr>
<td align="center">Atlant</td>
<td align="center">ONT and Illumina</td>
<td align="center">361.8</td>
<td align="center">0.4</td>
<td align="center">2,458</td>
<td align="center">94.4</td>
<td align="center">63.4</td>
<td align="center">0.7</td>
<td align="center">44.7</td>
</tr>
<tr>
<td align="center">Neiya No. 9</td>
<td align="center">PacBio HiFi and Illumina</td>
<td align="center">473.6</td>
<td align="center">0.9</td>
<td align="center">6,099</td>
<td align="center">94.8</td>
<td align="center">72.4</td>
<td align="center">1.2</td>
<td align="center">54.8</td>
</tr>
<tr>
<td align="center">YY5 v.2</td>
<td align="center">PacBio HiFi and BGI</td>
<td align="center">455.0</td>
<td align="center">9.6</td>
<td align="center">336</td>
<td align="center">94.5</td>
<td align="center">63.1</td>
<td align="center">0.7</td>
<td align="center">50.1</td>
</tr>
<tr>
<td align="center">
<bold>convar. <italic>crepitans</italic> K-1531</bold>
</td>
<td align="center">ONT and Illumina</td>
<td align="center">
<bold>412.6</bold>
</td>
<td align="center">
<bold>5.2</bold>
</td>
<td align="center">
<bold>1,483</bold>
</td>
<td align="center">
<bold>94.6</bold>
</td>
<td align="center">
<bold>64.0</bold>
</td>
<td align="center">
<bold>0.7</bold>
</td>
<td align="center">
<bold>49.9</bold>
</td>
</tr>
<tr>
<td align="center">CDC Bethune v.1</td>
<td align="center">Illumina</td>
<td align="center">282.2</td>
<td align="center">0.02</td>
<td align="center">48,397</td>
<td align="center">93.9</td>
<td align="center">60.4</td>
<td align="center">1.3</td>
<td align="center">33.3</td>
</tr>
<tr>
<td align="center">CDC Bethune v.2</td>
<td align="center">Illumina</td>
<td align="center">316.2</td>
<td align="center">0.02</td>
<td align="center">24,829</td>
<td align="center">93.7</td>
<td align="center">57.4</td>
<td align="center">0.9</td>
<td align="center">27.7</td>
</tr>
<tr>
<td align="center">Heiya 14</td>
<td align="center">Illumina</td>
<td align="center">303.7</td>
<td align="center">0.3</td>
<td align="center">4,581</td>
<td align="center">94.5</td>
<td align="center">62.6</td>
<td align="center">0.9</td>
<td align="center">36.1</td>
</tr>
<tr>
<td align="center">Longya 10</td>
<td align="center">Illumina</td>
<td align="center">306.4</td>
<td align="center">0.2</td>
<td align="center">4,419</td>
<td align="center">94.4</td>
<td align="center">60.5</td>
<td align="center">0.9</td>
<td align="center">36.0</td>
</tr>
<tr>
<td align="center">
<italic>L. bienne</italic> 15003</td>
<td align="center">Illumina</td>
<td align="center">293.6</td>
<td align="center">0.1</td>
<td align="center">6,369</td>
<td align="center">93.3</td>
<td align="center">50.4</td>
<td align="center">1.3</td>
<td align="center">36.3</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The obtained convar. <italic>crepitans</italic> assembly contained 49.9% of total interspersed repeats (<xref ref-type="table" rid="T1">Table 1</xref>) per &#x223c;413&#xa0;Mb (assembly length). Meanwhile, <italic>L. usitatissimum</italic> genome assemblies from long reads had 44.7%&#x2013;54.8% of repetitive sequences per 362&#x2013;474&#xa0;Mb. Flax genome assemblies from short reads comprised only 27.7%&#x2013;36.3% of total interspersed repeats and had a smaller size (294&#x2013;316&#xa0;Mb).</p>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<p>Plant genomes became the foundation of studies on the regulation of genetic features and their involvement in metabolic pathways, species evolution, and adaptation. Currently, genome sequencing is routine but relevant for agricultural plants. The genomes of crops are indispensable for modern breeding based on molecular procedures and targeted improvement of valuable plant features (<xref ref-type="bibr" rid="B8">Dmitriev et al., 2022</xref>). Furthermore, the availability of several diverse genome sequences for a species is key to the discovery of novel useful agricultural traits. For <italic>L. usitatissimum</italic>, seven genome sequences of different varieties were received earlier (<xref ref-type="bibr" rid="B43">You et al., 2018</xref>; <xref ref-type="bibr" rid="B10">Dmitriev et al., 2020b</xref>; <xref ref-type="bibr" rid="B44">Zhang et al., 2020</xref>; <xref ref-type="bibr" rid="B28">Sa et al., 2021</xref>; <xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>; <xref ref-type="bibr" rid="B45">Zhao et al., 2023</xref>). In this work, we sequenced the genome of <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic> which is no longer cultivated due to the dehiscence of capsules. However, such unused genomic material can still be the source of valuable agricultural features.</p>
<p>To obtain the genome of the convar. <italic>crepitans</italic>, we performed DNA sequencing on the Oxford Nanopore Technologies and Illumina platforms. We assembled the received data using a range of software and calculated quality statistics. Different assemblers were tested in our previous work on their efficacy in constructing the genome of <italic>L. usitatissimum</italic> line 3896 (<xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>). Most of the tested software (miniasm, NextDenovo, Raven, Shasta, SMARTdenovo, and wtdbg2) demonstrated poor QUAST and BUSCO statistics or assembled a genome of a significantly smaller size than the expected one. In our work on sequencing the genome of the Atlant cultivar, two tested tools (Shasta and wtdbg2) also showed poor performance (<xref ref-type="bibr" rid="B10">Dmitriev et al., 2020b</xref>). Therefore, we decided not to include the aforementioned assemblers in our current analysis and focused on the recently released tools and those that showed the best results.</p>
<p>Thus, to obtain draft assemblies, we used Canu, Flye, NECAT, and GoldRush. Canu, the most CPU time-consuming tool, still demonstrated the best performance in terms of assembly completeness and contiguity, including assembly size. NECAT produced the assembly with the highest N50 and the fewest number of contigs but of a size smaller than the expected one (400&#x2013;450&#xa0;Mb) and &#x223c;42&#xa0;Mb smaller than that for the assembly by Canu. Both assemblies had the same BUSCO completeness. Flye assembled a genome with QUAST and BUSCO statistics that was significantly worse but comparable to those of the assemblies by Canu and NECAT. At the same time, the assembly by Flye had the smallest relative number of mismatches/indels. Possibly, this could be due to the included polishing module (<xref ref-type="bibr" rid="B15">Kolmogorov et al., 2019</xref>). However, despite the achieved accuracy, the whole genome sequence still missed 20%&#x2013;30% of the expected genome size. GoldRush was unable to produce a genome with reasonable statistics. Thus, we considered the assembly by Canu optimal.</p>
<p>To improve the accuracy of the obtained genome assembly, one can apply a polishing procedure. The Canu-assembled genome was polished using ONT reads by the Racon (two iterations, both R.9.4.1 and R10.4.1 reads) and medaka (R10.4.1 reads) polishers. Each of the two rounds of Racon increased BUSCO completeness and the number of complete reference genomic features in the assembly. The procedure also decreased the relative number of mismatches and indels by 12.5% and 46.1%, respectively. Sequencing data from R9.4.1 flow cells are more inaccurate than those from R10.4.1 flow cells (<xref ref-type="bibr" rid="B31">Sereika et al., 2022</xref>). Thus, in our previous study, polishing with ONT data only from R9.4.1 flow cells had a less dramatic effect (<xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>). Polishing with medaka showed the same trend in statistic values as polishing with Racon. Final polishing with Illumina reads by POLCA also improved QUAST and BUSCO parameters. However, skipping polishing with ONT reads and polishing only with Illumina reads was not as beneficial as using both ONT and Illumina data. BUSCO completeness was almost the same for assemblies obtained according to Canu&#x2014;POLCA and Canu&#x2014;Racon &#xd7;2&#x2014;medaka&#x2014;POLCA. However, more mismatches/indels remained in the assembly polished only with Illumina reads. Thus, the final optimal assembly was obtained using the Canu&#x2014;Racon &#xd7;2&#x2014;medaka&#x2014;POLCA scheme (<xref ref-type="fig" rid="F3">Figure 3</xref>). The assembly had a size of 412.6&#xa0;Mb, consisted of 1,483 contigs, had an N50 of 5.2&#xa0;Mb, and a BUSCO completeness of 94.6%.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>The scheme used to obtain the final genome assembly of <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic>.</p>
</caption>
<graphic xlink:href="fgene-14-1269837-g003.tif"/>
</fig>
<p>BUSCO completeness of the obtained assembly was higher than that of the available assemblies for <italic>L. usitatissimum</italic>. Its length and repeat content were expectedly greater than these parameters of the assemblies obtained from short reads (varieties CDC Bethune, Longya 10, Heiya 14; <italic>L. bienne</italic> 15003). However, the repeat content in the genome of the convar. <italic>crepitans</italic> was similar to that of the assemblies from long reads (varieties 3896, Atlant, Neiya No. 9, and YY5 v.2). Thus, the non-coding sequences in the assembly are likely complete<italic>.</italic> The percentage of duplicated BUSCO in the obtained assembly was also high (above 60%) and comparable to that of <italic>L. usitatissimum</italic> assemblies. This fact correlates with the idea of <italic>L. usitatissimum</italic> origin. The species might have originated from the crossing of two <italic>Linum</italic> species. Then, the genome of the progeny probably underwent diploidization. Thus, the resulting ploidy of most genomic features is four (<xref ref-type="bibr" rid="B4">Bolsheva et al., 2017</xref>).</p>
<p>The assembled genome of the convar. <italic>crepitans</italic> has a quality comparable to that of the line 3896&#x2014;the NCBI reference genome for <italic>L. usitatissimum</italic>. The line 3896 genome was assembled and polished using ONT reads (<xref ref-type="bibr" rid="B11">Dvorianinova et al., 2022</xref>). Meanwhile, the genome of the convar. <italic>crepitans</italic> was assembled from ONT data and additionally polished with both ONT and Illumina reads. Thus, the assembly of the convar. <italic>crepitans</italic> has more complete BUSCO likely due to the improvement with accurate Illumina data. However, its contig N50 is lower than that of the assembly of line 3896 or variety YY5. In general, the obtained genome of the convar. <italic>crepitans</italic> has a quality close to that of most flax assemblies from long reads and outperformed the assemblies from short reads. Nevertheless, its level can still be upgraded to the chromosome one, e.g., using Hi-C data.</p>
<p>In this work, we sequenced the first genome of <italic>L. usitatissimum</italic> convar. <italic>crepitans</italic>. The volume and quality of the obtained data were sufficient to produce a high-quality assembly with QUAST and BUSCO statistics that were superior or close to those of the available <italic>L. usitatissimum</italic> genomes. Its quality level can be additionally upgraded to the scaffold and chromosome level. Our data allow investigating the diversity and evolution of the section <italic>Linum</italic> as well as mining key traits for breeding.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found as follows: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, PRJNA1006423.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>ED: writing&#x2013;original draft, writing&#x2013;review and editing, and investigation. EP: writing&#x2013;review and editing and investigation. NB: writing&#x2013;review and editing and investigation. EB: writing&#x2013;review and editing and investigation. TR: writing&#x2013;review and editing and investigation. DZ: writing&#x2013;review and editing and investigation. RN: writing&#x2013;review and editing and investigation. AT: writing&#x2013;review and editing and investigation. ES: writing&#x2013;review and editing and investigation. NM: conceptualization, writing&#x2013;original draft, writing&#x2013;review and editing and investigation. AD: conceptualization, writing&#x2013;original draft, writing&#x2013;review and editing, and investigation.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. The work was financially supported by the Ministry of Science and Higher Education of the Russian Federation, grant number 075-15-2021-1064.</p>
</sec>
<ack>
<p>The authors would like to thank the Center for Precision Genome Editing and Genetic Technologies for Biomedicine, EIMB RAS for providing the computing power and techniques for the data analysis. This work was performed using the equipment of EIMB RAS &#x201c;Genome&#x201d; center (<ext-link ext-link-type="uri" xlink:href="http://www.eimb.ru/ru1/ckp/ccu_genome_ce.php">http://www.eimb.ru/ru1/ckp/ccu_genome_ce.php</ext-link>).</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors, and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bartlett</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Moyers</surname>
<given-names>B. T.</given-names>
</name>
<name>
<surname>Man</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Subramaniam</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Makunga</surname>
<given-names>N. P.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>The power and perils of <italic>de novo</italic> domestication using genome editing</article-title>. <source>Annu. Rev. Plant Biol.</source> <volume>74</volume> (<issue>1</issue>), <fpage>727</fpage>&#x2013;<lpage>750</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-arplant-053122-030653</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Batog</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wawro</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gieparda</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Bujnowicz</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Foksowicz-Flaczyk</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Rojewski</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Effective use of flax biomass in biorefining processes</article-title>. <source>Appl. Sci.</source> <volume>13</volume> (<issue>13</issue>), <fpage>7359</fpage>. <pub-id pub-id-type="doi">10.3390/app13137359</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bolger</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Lohse</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Usadel</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Trimmomatic: a flexible trimmer for Illumina sequence data</article-title>. <source>Bioinformatics</source> <volume>30</volume> (<issue>15</issue>), <fpage>2114</fpage>&#x2013;<lpage>2120</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu170</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bolsheva</surname>
<given-names>N. L.</given-names>
</name>
<name>
<surname>Melnikova</surname>
<given-names>N. V.</given-names>
</name>
<name>
<surname>Kirov</surname>
<given-names>I. V.</given-names>
</name>
<name>
<surname>Speranskaya</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Krinitsina</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Dmitriev</surname>
<given-names>A. A.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Evolution of blue-flowered species of genus Linum based on high-throughput sequencing of ribosomal RNA genes</article-title>. <source>BMC Evol. Biol.</source> <volume>17</volume> (<issue>2</issue>), <fpage>253</fpage>. <pub-id pub-id-type="doi">10.1186/s12862-017-1105-x</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Nie</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>S.-Q.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>Y.-F.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Bray</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Efficient assembly of nanopore reads via highly accurate and intact error correction</article-title>. <source>Nat. Commun.</source> <volume>12</volume> (<issue>1</issue>), <fpage>60</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-20236-7</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Choudhury</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Deb</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kharbyngar</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Rajpal</surname>
<given-names>V. R.</given-names>
</name>
<name>
<surname>Rao</surname>
<given-names>S. R.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Dissecting the plant genome: through new generation molecular markers</article-title>. <source>Genet. Resour. Crop Evol.</source> <volume>69</volume> (<issue>8</issue>), <fpage>2661</fpage>&#x2013;<lpage>2698</lpage>. <pub-id pub-id-type="doi">10.1007/s10722-022-01441-3</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Diederichsen</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>A taxonomic view on genetic resources in the genus Linum L. For flax breeding</article-title>,&#x201d; in <source>Genetics and genomics of Linum</source>. Editor <person-group person-group-type="editor">
<name>
<surname>Cullis</surname>
<given-names>C. A.</given-names>
</name>
</person-group> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>15</lpage>.</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dmitriev</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pushkova</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Melnikova</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Plant genome sequencing: modern technologies and novel opportunities for breeding</article-title>. <source>Mol. Biol.</source> <volume>56</volume> (<issue>4</issue>), <fpage>495</fpage>&#x2013;<lpage>507</lpage>. <pub-id pub-id-type="doi">10.1134/s0026893322040045</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dmitriev</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Kezimana</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Rozhmina</surname>
<given-names>T. A.</given-names>
</name>
<name>
<surname>Zhuchenko</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Povkhova</surname>
<given-names>L. V.</given-names>
</name>
<name>
<surname>Pushkova</surname>
<given-names>E. N.</given-names>
</name>
<etal/>
</person-group> (<year>2020a</year>). <article-title>Genetic diversity of SAD and FAD genes responsible for the fatty acid composition in flax cultivars and lines</article-title>. <source>BMC Plant Biol.</source> <volume>20</volume> (<issue>1</issue>), <fpage>301</fpage>. <pub-id pub-id-type="doi">10.1186/s12870-020-02499-w</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dmitriev</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Pushkova</surname>
<given-names>E. N.</given-names>
</name>
<name>
<surname>Novakovskiy</surname>
<given-names>R. O.</given-names>
</name>
<name>
<surname>Beniaminov</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Rozhmina</surname>
<given-names>T. A.</given-names>
</name>
<name>
<surname>Zhuchenko</surname>
<given-names>A. A.</given-names>
</name>
<etal/>
</person-group> (<year>2020b</year>). <article-title>Genome sequencing of fiber flax cultivar Atlant using Oxford Nanopore and Illumina platforms</article-title>. <source>Front. Genet.</source> <volume>11</volume>, <fpage>590282</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2020.590282</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dvorianinova</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Bolsheva</surname>
<given-names>N. L.</given-names>
</name>
<name>
<surname>Pushkova</surname>
<given-names>E. N.</given-names>
</name>
<name>
<surname>Rozhmina</surname>
<given-names>T. A.</given-names>
</name>
<name>
<surname>Zhuchenko</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Novakovskiy</surname>
<given-names>R. O.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Isolating Linum usitatissimum L. nuclear DNA enabled assembling high-quality genome</article-title>. <source>Int. J. Mol. Sci.</source> <volume>23</volume> (<issue>21</issue>), <fpage>13244</fpage>. <pub-id pub-id-type="doi">10.3390/ijms232113244</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>El Karkouri</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Ghigo</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Raoult</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Fournier</surname>
<given-names>P.-E.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Genomic evolution and adaptation of arthropod-associated Rickettsia</article-title>. <source>Sci. Rep.</source> <volume>12</volume> (<issue>1</issue>), <fpage>3807</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-022-07725-z</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gurevich</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Saveliev</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Vyahhi</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Tesler</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>QUAST: quality assessment tool for genome assemblies</article-title>. <source>Bioinformatics</source> <volume>29</volume> (<issue>8</issue>), <fpage>1072</fpage>&#x2013;<lpage>1075</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btt086</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kezimana</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dmitriev</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Kudryavtseva</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Romanova</surname>
<given-names>E. V.</given-names>
</name>
<name>
<surname>Melnikova</surname>
<given-names>N. V.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Secoisolariciresinol diglucoside of flaxseed and its metabolites: biosynthesis and potential for nutraceuticals</article-title>. <source>Front. Genet.</source> <volume>9</volume>, <fpage>641</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2018.00641</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kolmogorov</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yuan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Pevzner</surname>
<given-names>P. A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Assembly of long, error-prone reads using repeat graphs</article-title>. <source>Nat. Biotechnol.</source> <volume>37</volume> (<issue>5</issue>), <fpage>540</fpage>&#x2013;<lpage>546</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-019-0072-8</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koren</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Walenz</surname>
<given-names>B. P.</given-names>
</name>
<name>
<surname>Berlin</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Miller</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Bergman</surname>
<given-names>N. H.</given-names>
</name>
<name>
<surname>Phillippy</surname>
<given-names>A. M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Canu: scalable and accurate long-read assembly via adaptive k-mer weighting and repeat separation</article-title>. <source>Genome Res.</source> <volume>27</volume> (<issue>5</issue>), <fpage>722</fpage>&#x2013;<lpage>736</lpage>. <pub-id pub-id-type="doi">10.1101/gr.215087.116</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krasnov</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>Pushkova</surname>
<given-names>E. N.</given-names>
</name>
<name>
<surname>Novakovskiy</surname>
<given-names>R. O.</given-names>
</name>
<name>
<surname>Kudryavtseva</surname>
<given-names>L. P.</given-names>
</name>
<name>
<surname>Rozhmina</surname>
<given-names>T. A.</given-names>
</name>
<name>
<surname>Dvorianinova</surname>
<given-names>E. M.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>High-quality genome assembly of Fusarium oxysporum f. sp. lini</article-title>. <source>Front. Genet.</source> <volume>11</volume>, <fpage>959</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2020.00959</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM</article-title>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1303.3997">https://arxiv.org/abs/1303.3997</ext-link>.</comment>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Handsaker</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wysoker</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fennell</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ruan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Homer</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>The sequence alignment/map format and SAMtools</article-title>. <source>bioinformatics</source> <volume>25</volume> (<issue>16</issue>), <fpage>2078</fpage>&#x2013;<lpage>2079</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xing</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Plant pan-genomics: recent advances, new challenges, and roads ahead</article-title>. <source>J. Genet. Genomics</source> <volume>49</volume> (<issue>9</issue>), <fpage>833</fpage>&#x2013;<lpage>846</lpage>. <pub-id pub-id-type="doi">10.1016/j.jgg.2022.06.004</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Melnikova</surname>
<given-names>N. V.</given-names>
</name>
<name>
<surname>Pushkova</surname>
<given-names>E. N.</given-names>
</name>
<name>
<surname>Dvorianinova</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Beniaminov</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Novakovskiy</surname>
<given-names>R. O.</given-names>
</name>
<name>
<surname>Povkhova</surname>
<given-names>L. V.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Genome assembly and sex-determining region of male and female Populus &#xd7; sibirica</article-title>. <source>Front. Plant Sci.</source> <volume>12</volume>, <fpage>625416</fpage>. <pub-id pub-id-type="doi">10.3389/fpls.2021.625416</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>More</surname>
<given-names>A. P.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Flax fiber&#x2013;based polymer composites: a review</article-title>. <source>Adv. Compos. Hybrid Mater.</source> <volume>5</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1007/s42114-021-00246-9</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Muir</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Westcott</surname>
<given-names>N. D.</given-names>
</name>
</person-group> (<year>2003</year>). <source>Flax: the genus Linum</source>. <publisher-loc>Boca Raton, Florida</publisher-loc>: <publisher-name>CRC Press</publisher-name>.</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nag</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mitra</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Karmakar</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>An overview on flax (Linum usitatissimum L.) and its genetic diversity</article-title>. <source>Int. J. Agric. Environ. Biotechnol.</source> <volume>8</volume> (<issue>4</issue>), <fpage>805</fpage>&#x2013;<lpage>817</lpage>. <pub-id pub-id-type="doi">10.5958/2230-732x.2015.00089.3</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>N&#xfc;tzmann</surname>
<given-names>H.-W.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Osbourn</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Plant metabolic clusters &#x2013; from genetics to genomics</article-title>. <source>New Phytol.</source> <volume>211</volume> (<issue>3</issue>), <fpage>771</fpage>&#x2013;<lpage>789</lpage>. <pub-id pub-id-type="doi">10.1111/nph.13981</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ou</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>LTR_retriever: a highly accurate and sensitive program for identification of long terminal repeat retrotransposons</article-title>. <source>Plant physiol.</source> <volume>176</volume> (<issue>2</issue>), <fpage>1410</fpage>&#x2013;<lpage>1422</lpage>. <pub-id pub-id-type="doi">10.1104/pp.17.01310</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Petereit</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bayer</surname>
<given-names>P. E.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>W. J. W.</given-names>
</name>
<name>
<surname>Tay Fernandez</surname>
<given-names>C. G.</given-names>
</name>
<name>
<surname>Amas</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Pangenomics and crop genome adaptation in a changing climate</article-title>. <source>Plants</source> <volume>11</volume> (<issue>15</issue>), <fpage>1949</fpage>. <pub-id pub-id-type="doi">10.3390/plants11151949</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sa</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Siqin</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>An</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Chromosome-level genome assembly and annotation of the fiber flax (Linum usitatissimum) genome</article-title>. <source>Front. Genet.</source> <volume>12</volume>, <fpage>735690</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2021.735690</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salem</surname>
<given-names>M. O. A.</given-names>
</name>
<name>
<surname>Ta&#x15f;tan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Bilen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Terzi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>S&#xf6;nmez</surname>
<given-names>A. Y.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Dietary flaxseed (Linum usitatissimum) oil supplementation affects growth, oxidative stress, immune response, and diseases resistance in rainbow trout (<italic>Oncorhynchus mykiss</italic>)</article-title>. <source>Fish Shellfish Immunol.</source> <volume>138</volume>, <fpage>108798</fpage>. <pub-id pub-id-type="doi">10.1016/j.fsi.2023.108798</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sedeek</surname>
<given-names>K. E. M.</given-names>
</name>
<name>
<surname>Mahas</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mahfouz</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Plant genome engineering for targeted improvement of crop traits</article-title>. <source>Front. Plant Sci.</source> <volume>10</volume>, <fpage>114</fpage>. <pub-id pub-id-type="doi">10.3389/fpls.2019.00114</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sereika</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kirkegaard</surname>
<given-names>R. H.</given-names>
</name>
<name>
<surname>Karst</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Michaelsen</surname>
<given-names>T. Y.</given-names>
</name>
<name>
<surname>S&#xf8;rensen</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Wollenberg</surname>
<given-names>R. D.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Oxford Nanopore R10.4 long-read sequencing enables the generation of near-finished bacterial genomes from pure cultures and metagenomes without short-read or reference polishing</article-title>. <source>Nat. Methods</source> <volume>19</volume> (<issue>7</issue>), <fpage>823</fpage>&#x2013;<lpage>826</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-022-01539-7</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sim&#xe3;o</surname>
<given-names>F. A.</given-names>
</name>
<name>
<surname>Waterhouse</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Ioannidis</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kriventseva</surname>
<given-names>E. V.</given-names>
</name>
<name>
<surname>Zdobnov</surname>
<given-names>E. M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs</article-title>. <source>Bioinformatics</source> <volume>31</volume> (<issue>19</issue>), <fpage>3210</fpage>&#x2013;<lpage>3212</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv351</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singh</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>van der Hooft</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>van Wees</surname>
<given-names>S. C.</given-names>
</name>
<name>
<surname>Medema</surname>
<given-names>M. H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Integrative omics approaches for biosynthetic pathway discovery in plants</article-title>. <source>Nat. Product. Rep.</source> <volume>39</volume> (<issue>9</issue>), <fpage>1876</fpage>&#x2013;<lpage>1896</lpage>. <pub-id pub-id-type="doi">10.1039/d2np00032f</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sirotkin</surname>
<given-names>A. V.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Influence of flaxseed (Linum usitatissimum) on female reproduction</article-title>. <source>Planta Medica</source> <volume>89</volume>, <fpage>608</fpage>&#x2013;<lpage>615</lpage>. <pub-id pub-id-type="doi">10.1055/a-2013-2966</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname>
<given-names>J.-M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Z.-W.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Oil plant genomes: current state of the science</article-title>. <source>J. Exp. Bot.</source> <volume>73</volume> (<issue>9</issue>), <fpage>2859</fpage>&#x2013;<lpage>2874</lpage>. <pub-id pub-id-type="doi">10.1093/jxb/erab472</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Q.-H.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Twenty years of plant genome sequencing: achievements and challenges</article-title>. <source>Trends Plant Sci.</source> <volume>27</volume>, <fpage>391</fpage>&#x2013;<lpage>401</lpage>. <pub-id pub-id-type="doi">10.1016/j.tplants.2021.10.006</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Tello-Ruiz</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Jaiswal</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ware</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2022</year>). &#x201c;<article-title>Gramene: a resource for comparative analysis of plants genomes and pathways</article-title>,&#x201d; in <source>Plant bioinformatics: methods and protocols</source> (<publisher-loc>Berlin, Germany</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>101</fpage>&#x2013;<lpage>131</lpage>.</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van der Werf</surname>
<given-names>H. M.</given-names>
</name>
<name>
<surname>Turunen</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>The environmental impacts of the production of hemp and flax textile yarn</article-title>. <source>Industrial Crops Prod.</source> <volume>27</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1016/j.indcrop.2007.05.003</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vaser</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Sovi&#x107;</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Nagarajan</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>&#x160;iki&#x107;</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Fast and accurate <italic>de novo</italic> genome assembly from long uncorrected reads</article-title>. <source>Genome Res.</source> <volume>27</volume> (<issue>5</issue>), <fpage>737</fpage>&#x2013;<lpage>746</lpage>. <pub-id pub-id-type="doi">10.1101/gr.214270.116</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Cimen</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Buckler</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Deep learning for plant genomics and crop improvement</article-title>. <source>Curr. Opin. Plant Biol.</source> <volume>54</volume>, <fpage>34</fpage>&#x2013;<lpage>41</lpage>. <pub-id pub-id-type="doi">10.1016/j.pbi.2019.12.010</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Padua</surname>
<given-names>G. W.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Properties of zein films coated with drying oils</article-title>. <source>J. Agric. Food Chem.</source> <volume>53</volume> (<issue>9</issue>), <fpage>3444</fpage>&#x2013;<lpage>3448</lpage>. <pub-id pub-id-type="doi">10.1021/jf047994n</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Coombe</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Nikoli&#x107;</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Nip</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Sidhu</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Linear time complexity <italic>de novo</italic> long read genome assembly with GoldRush</article-title>. <source>Nat. Commun.</source> <volume>14</volume> (<issue>1</issue>), <fpage>2906</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-023-38716-x</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>You</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Jia</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Chromosome&#x2010;scale pseudomolecules refined by optical, physical and genetic maps in flax</article-title>. <source>Plant J.</source> <volume>95</volume> (<issue>2</issue>), <fpage>371</fpage>&#x2013;<lpage>384</lpage>. <pub-id pub-id-type="doi">10.1111/tpj.13944</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Dang</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Genomic comparison and population diversity analysis provide insights into the domestication and improvement of flax</article-title>. <source>Iscience</source> <volume>23</volume> (<issue>4</issue>), <fpage>100967</fpage>. <pub-id pub-id-type="doi">10.1016/j.isci.2020.100967</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zuo</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>High-quality genome assembly and genome-wide association study of male sterility provide resources for flax improvement</article-title>. <source>Plants</source> <volume>12</volume> (<issue>15</issue>), <fpage>2773</fpage>. <pub-id pub-id-type="doi">10.3390/plants12152773</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Unlocking plant metabolic diversity: a (pan)-genomic view</article-title>. <source>Plant Commun.</source> <volume>3</volume>, <fpage>100300</fpage>. <pub-id pub-id-type="doi">10.1016/j.xplc.2022.100300</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zimin</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Mar&#xe7;ais</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Puiu</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Roberts</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Salzberg</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Yorke</surname>
<given-names>J. A.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>The MaSuRCA genome assembler</article-title>. <source>Bioinformatics</source> <volume>29</volume> (<issue>21</issue>), <fpage>2669</fpage>&#x2013;<lpage>2677</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btt476</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>