<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2016.01883</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Comparative Characterization of the Leaf Tissue of <italic>Physalis alkekengi</italic> and <italic>Physalis peruviana</italic> Using RNA-seq and Metabolite Profiling</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Fukushima</surname> <given-names>Atsushi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/27844/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Nakamura</surname> <given-names>Michimi</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/232538/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Suzuki</surname> <given-names>Hideyuki</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/46142/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Yamazaki</surname> <given-names>Mami</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/26059/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Knoch</surname> <given-names>Eva</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/142754/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Mori</surname> <given-names>Tetsuya</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Umemoto</surname> <given-names>Naoyuki</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/361403/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Morita</surname> <given-names>Masaki</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/365678/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Hirai</surname> <given-names>Go</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Sodeoka</surname> <given-names>Mikiko</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Saito</surname> <given-names>Kazuki</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/12155/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>RIKEN Center for Sustainable Resource Science</institution> <country>Yokohama, Japan</country></aff>
<aff id="aff2"><sup>2</sup><institution>Graduate School of Pharmaceutical Sciences, Chiba University</institution> <country>Chiba, Japan</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Biotechnology Research, Kazusa DNA Research Institute</institution> <country>Chiba, Japan</country></aff>
<aff id="aff4"><sup>4</sup><institution>Synthetic Organic Chemistry Laboratory, RIKEN</institution> <country>Saitama, Japan</country></aff>
<aff id="aff5"><sup>5</sup><institution>RIKEN Center for Sustainable Resource Science</institution> <country>Saitama, Japan</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: <italic>Xiaowu Wang, Chinese Academy of Agricultural Sciences, China</italic></p></fn>
<fn fn-type="edited-by"><p>Reviewed by: <italic>Erli Pang, Beijing Normal University, China; Zhonghua Zhang, Chinese Academy of Agricultural Sciences, China</italic></p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x002A;Correspondence: <italic>Atsushi Fukushima, <email>atsushi.fukushima@riken.jp</email> Kazuki Saito, <email>kazuki.saito@riken.jp</email></italic></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Plant Genetics and Genomics, a section of the journal Frontiers in Plant Science</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>20</day>
<month>12</month>
<year>2016</year>
</pub-date>
<pub-date pub-type="collection">
<year>2016</year>
</pub-date>
<volume>7</volume>
<elocation-id>1883</elocation-id>
<history>
<date date-type="received">
<day>13</day>
<month>07</month>
<year>2016</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>11</month>
<year>2016</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2016 Fukushima, Nakamura, Suzuki, Yamazaki, Knoch, Mori, Umemoto, Morita, Hirai, Sodeoka and Saito.</copyright-statement>
<copyright-year>2016</copyright-year>
<copyright-holder>Fukushima, Nakamura, Suzuki, Yamazaki, Knoch, Mori, Umemoto, Morita, Hirai, Sodeoka and Saito</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>The genus <italic>Physalis</italic> in the <italic>Solanaceae</italic> family contains several species of benefit to humans. Examples include <italic>P. alkekengi</italic> (Chinese-lantern plant, h&#x00F4;zuki in Japanese) used for medicinal and for decorative purposes, and <italic>P. peruviana</italic>, also known as Cape gooseberry, which bears an edible, vitamin-rich fruit. Members of the <italic>Physalis</italic> genus are a valuable resource for phytochemicals needed for the development of medicines and functional foods. To fully utilize the potential of these phytochemicals we need to understand their biosynthesis, and for this we need genomic data, especially comprehensive transcriptome datasets for gene discovery. We report the <italic>de novo</italic> assembly of the transcriptome from leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> using Illumina RNA-seq technologies. We identified 75,221 unigenes in <italic>P. alkekengi</italic> and 54,513 in <italic>P. peruviana</italic>. All unigenes were annotated with gene ontology (GO), Enzyme Commission (EC) numbers, and pathway information from the Kyoto Encyclopedia of Genes and Genomes (KEGG). We classified unigenes encoding enzyme candidates putatively involved in the secondary metabolism and identified more than one unigenes for each step in terpenoid backbone- and steroid biosynthesis in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>. To measure the variability of the withanolides including physalins and provide insights into their chemical diversity in <italic>Physalis</italic>, we also analyzed the metabolite content in leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> at five different developmental stages by liquid chromatography-mass spectrometry. We discuss that comprehensive transcriptome approaches within a family can yield a clue for gene discovery in <italic>Physalis</italic> and provide insights into their complex chemical diversity. The transcriptome information we submit here will serve as an important public resource for further studies of the specialized metabolism of <italic>Physalis</italic> species.</p>
</abstract>
<kwd-group>
<kwd><italic>Physalis</italic></kwd>
<kwd><italic>de novo</italic> transcriptome assembly</kwd>
<kwd>deep sequencing</kwd>
<kwd>marker development</kwd>
<kwd>secondary metabolism</kwd>
<kwd>physalin</kwd>
<kwd>withanolide</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="51"/>
<page-count count="12"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec><title>Introduction</title>
<p>The specialized or secondary metabolism in plants is an important source for fine chemicals including drugs, dyes, vitamins, and other chemical materials. The genus <italic>Physalis</italic>, the largest genera in the <italic>Solanoideae</italic> subfamily, contains the most economically important genera, e.g., <italic>Solanum tuberosum</italic> (potato), <italic>S. lycopersicum</italic> (tomato), and <italic>Capsicum annuum</italic> (red pepper; <xref ref-type="bibr" rid="B29">Martinez, 1998</xref>). Some plants in approximately 90 species have a long history of cultivation. <italic>P. alkekengi var. franchetii</italic> (Chinese-lantern, h&#x00F4;zuki in Japanese) has been used as a medicinal plant and for decorative purposes. <italic>P. peruviana</italic>, also known as Cape gooseberry, has an edible fruit that contains many vitamins and antioxidants (<xref ref-type="bibr" rid="B36">Ramadan and Morsel, 2003</xref>).</p>
<p>Members of the genus <italic>Physalis</italic> produce bioactive metabolites such as steroidal lactones withanolides (<xref ref-type="bibr" rid="B3">Eich, 2008</xref>). <italic>P. peruviana</italic> can produce withanolides and, <italic>P. alkekengi</italic> physalins, a different subgroup of withanolides. The structures of physalins A and B were first determined in 1969 (<xref ref-type="bibr" rid="B30">Matsuura and Kawai, 1969</xref>; <xref ref-type="bibr" rid="B31">Matsuura et al., 1969</xref>) and subsequently more than 30 physalins were isolated. Studies using spectroscopic methods isolated 3 new- and 7 known steroids including physalins and demonstrated that physalin B exhibited the most significant cytotoxic activities against HeLa human cervical cells (<xref ref-type="bibr" rid="B22">Kawai et al., 2002</xref>; <xref ref-type="bibr" rid="B27">Li et al., 2014</xref>). Physalin B or F inhibited NF-kappa B activation (<xref ref-type="bibr" rid="B20">Jacobo-Herrera et al., 2006</xref>; <xref ref-type="bibr" rid="B46">Wu et al., 2012</xref>) and both right- and left-sided partial structures were proposed to play a significant role in their mode of action (<xref ref-type="bibr" rid="B34">Ozawa et al., 2013</xref>). 4&#x03B2;-Hydroxywithanolide E derived from <italic>P. peruviana</italic> inhibited the growth of a human non-small lung cancer cell line (<xref ref-type="bibr" rid="B50">Yen et al., 2010</xref>).</p>
<p>High-throughput DNA sequencing with a next-generation sequencer (NGS) is useful for genome assembly, the detection of single nucleotide polymorphisms (SNPs) and genetic variations, and for transcriptome characterization (<xref ref-type="bibr" rid="B44">Wang et al., 2009</xref>; <xref ref-type="bibr" rid="B7">Garber et al., 2011</xref>). RNA sequencing (RNA-seq) on NGSs can be used for both model and non-model plants (<xref ref-type="bibr" rid="B9">Gongora-Castillo and Buell, 2013</xref>; <xref ref-type="bibr" rid="B5">Fukushima and Kusano, 2014</xref>; <xref ref-type="bibr" rid="B45">Weber, 2015</xref>). Successful transcriptome studies on non-model plants, e.g., crop plants such as the eggplant (<xref ref-type="bibr" rid="B38">Ramesh et al., 2016</xref>), pepper (<xref ref-type="bibr" rid="B12">Gordo et al., 2012</xref>) and tobacco (<xref ref-type="bibr" rid="B25">Lei et al., 2014</xref>) and medicinal plants, e.g., <italic>Withania somnifera</italic> (<xref ref-type="bibr" rid="B16">Gupta et al., 2013</xref>; <xref ref-type="bibr" rid="B39">Senthil et al., 2015</xref>) and <italic>P. peruviana</italic> (<xref ref-type="bibr" rid="B8">Garzon-Martinez et al., 2012</xref>) from the <italic>Solanaceae</italic> family have been published. Resources for transcriptome data from medicinal plants, e.g., the Medicinal Plant Genomics Resource (MPGR<sup><xref ref-type="fn" rid="fn01">1</xref></sup>) and the Medicinal Plants Transcriptomics (Medplants<sup><xref ref-type="fn" rid="fn02">2</xref></sup>; <xref ref-type="bibr" rid="B10">Gongora-Castillo et al., 2012a</xref>,<xref ref-type="bibr" rid="B11">b</xref>; <xref ref-type="bibr" rid="B51">Yeo et al., 2013</xref>) are available. To take full advantage of the potential of important phytochemicals we need to elucidate their biosynthesis. For this we need genomic data, especially comprehensive transcriptome datasets for gene discovery.</p>
<p>Our main aim of this study is to describe the whole transcriptome map of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> leaves and to inventory the basic information about a wide range of the metabolism including the withanolide biosynthesis pathway in leaves (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>). Here we present a <italic>de novo</italic> assembly transcriptome from the leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>. We employed Illumina RNA-seq techniques and demonstrate that these resources can provide the means for a better understanding of chemical diversity in <italic>Physalis</italic> species. We annotated the assembled unigenes in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> and classified unigenes encoding enzyme candidates putatively involved in secondary metabolism. Our approaches provide a basis for future researches on bio-engineering of <italic>Physalis</italic> plants and they represent a shortcut to gene discovery in these species.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p><bold>Possible pathways of withanolide biosynthesis.</bold> Our main aim of this study is to describe the whole transcriptome map of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> leaves and to inventory the basic information about a wide range of the metabolism including the withanolide biosynthesis pathway in leaf tissues. Although the assembled unigenes are hypothetic/proposed candidate genes, comparative transcriptome analysis using other <italic>Physalis</italic> species is a promising way to study and identify species-specific and evolutionary conserved pathways involved in highly complex biosynthesis of withanolides like physalin. Single black arrows show one step, two or more gray arrows show multiple unknown steps. Abbreviation: IPP, isopentenyl pyrophosphate; DMAPP, dimethylallyl pyrophosphate; GPP, geranyl pyrophosphate; FPP, farnesyl pyrophosphate; and SQ, squalene. Enzyme abbreviation: (1) Geranyl diphosphate Synthase (GPPS, EC 2.5.1.1); (2) Farnesyl diphosphate Synthase (FPPS, EC 2.5.1.10); (3), Squalene Synthase (SQS, EC 2.5.1.21); (4) Cycloartenol Synthase (CAS, EC 5.4.99.8); (5) Cycloartenol C-24 methyltransferase (SMT1, EC 2.1.1.41); (6) Sterol-4a-methyl oxidase (SMO, EC 1 1.14.13.72); (7) Cycloeucalenol cycloisomerase (CECI, EC 5.5.1.9); (8) obtusifoliol 14-demethylase (CYP51G1, EC 1.14.13.70); (9) D14-sterol reductase (FK, EC 1.3.1.70); (10) C-7,8 sterol isomerase (HYDI, EC 5.3.3.5); (11) Sterol-4a-methyl oxidase 2 (SMO2, EC 1.14.13.72); (12) C-5 sterol desaturase (STE1, EC 1.14.21.6); and (13) Sterol &#x0394;7 reductase (DWF5, EC 1.3.1.21).</p></caption>
<graphic xlink:href="fpls-07-01883-g001.tif"/>
</fig>
</sec>
<sec id="s1" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec><title>Plant Materials, RNA Isolation, and cDNA Synthesis</title>
<p><italic>Physalis alkekengi var. franchetii</italic> and <italic>P. peruviana</italic> (Ground Cherry or Golden Berry) plants were grown in the experimental gardens of the RIKEN Center for Sustainable Resource Science, Wako, Saitama, Japan. They are not an endangered or protected species. The third fresh leaves were collected from healthy plants (<bold>Supplementary Image <xref ref-type="supplementary-material" rid="SM1">1</xref></bold>). RNA isolation and cDNA synthesis for sequencing were carried out as previously reported (<xref ref-type="bibr" rid="B6">Fukushima et al., 2015</xref>; <xref ref-type="bibr" rid="B17">Han et al., 2015a</xref>,<xref ref-type="bibr" rid="B18">b</xref>). We used unreplicated data for one sample per species.</p>
</sec>
<sec><title>Illumina Sequencing</title>
<p>For the generation of cDNA libraries we employed an Illumina HiSeq 2000 sequencer (Illumina Inc., San Diego, CA, USA). We sequenced 100-bp paired-end (PE) reads as described (<xref ref-type="bibr" rid="B6">Fukushima et al., 2015</xref>; <xref ref-type="bibr" rid="B17">Han et al., 2015a</xref>,<xref ref-type="bibr" rid="B18">b</xref>). Our short-read data in FASTQ file format were produced by Casava 1.8 (Illumina, Inc. San Diego, CA, USA). Short reads that did not pass Illumina&#x2019;s standard quality filter were eliminated. The process yielded clean reads from the mRNA pool isolated from <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>, respectively (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>).</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Summary of sequencing and assembly results after Illumina sequencing of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Species</th>
<th valign="top" align="left"><italic>P. alkekengi</italic></th>
<th valign="top" align="left"><italic>P. peruviana</italic></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Sequencing results</td>
<td valign="top" align="left"></td>
<td valign="top" align="left"></td>
</tr>
<tr>
<td valign="top" align="left">Total length of clean reads (bp)</td>
<td valign="top" align="left">2,540,006,580</td>
<td valign="top" align="left">2,345,503,406</td>
</tr>
<tr>
<td valign="top" align="left">G + C%</td>
<td valign="top" align="left">43.1</td>
<td valign="top" align="left">43.4</td>
</tr>
<tr>
<td valign="top" align="left" colspan="2">Assembly results (unigenes)</td>
<td valign="top" align="left"></td>
</tr>
<tr>
<td valign="top" align="left">Number</td>
<td valign="top" align="left">75,221</td>
<td valign="top" align="left">54,513</td>
</tr>
<tr>
<td valign="top" align="left">Average length (bp)</td>
<td valign="top" align="left">867</td>
<td valign="top" align="left">930</td>
</tr>
<tr>
<td valign="top" align="left">Maximum length (bp)</td>
<td valign="top" align="left">14,564</td>
<td valign="top" align="left">12,329</td>
</tr>
<tr>
<td valign="top" align="left">Minimum length (bp)</td>
<td valign="top" align="left">201</td>
<td valign="top" align="left">201</td>
</tr>
<tr>
<td valign="top" align="left">N50 (bp)</td>
<td valign="top" align="left">1,550</td>
<td valign="top" align="left">1,636</td>
</tr>
<tr>
<td valign="top" align="left">G + C%</td>
<td valign="top" align="left">39.8</td>
<td valign="top" align="left">40.5</td></tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec><title>Data Pre-processing and <italic>De novo</italic> Transcriptome Assembly</title>
<p>We performed <italic>de novo</italic> transcriptome assembly using the Trinity program (<xref ref-type="bibr" rid="B14">Grabherr et al., 2011</xref>). We then subjected the assembled unigenes to read alignment and transcript abundance estimation with Bowtie (<xref ref-type="bibr" rid="B24">Langmead et al., 2009</xref>) and RSEM (<xref ref-type="bibr" rid="B26">Li and Dewey, 2011</xref>). To estimate transcript abundance we used the Fragments Per Kilobase of exon per Million mapped fragments (FPKM) method. We identified 75,221 unigenes in <italic>P. alkekengi</italic> and 54,513 unigenes in <italic>P. peruviana</italic>. The length and G + C% distribution of all unigenes are shown in <bold>Figures <xref ref-type="fig" rid="F2">2A,B</xref></bold>. The G + C% and basic statistics were calculated with the custom Ruby/Bioruby script (<xref ref-type="bibr" rid="B13">Goto et al., 2010</xref>), &#x201C;Biostrings&#x201D; (<xref ref-type="bibr" rid="B35">Pages et al., 2009</xref>), and the R/Bioconductor package &#x201C;ShortRead&#x201D; (<xref ref-type="bibr" rid="B32">Morgan et al., 2009</xref>). For quality control we used the FASTX-Toolkit <sup><xref ref-type="fn" rid="fn03">3</xref></sup> and the FastQC package<sup><xref ref-type="fn" rid="fn04">4</xref></sup>. Default settings were used in all calculations in this section.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p><bold>Overview of the <italic>de novo</italic> transcriptome assembly in <italic>P. alkekengi</italic> (A)</bold> and <italic>P. peruviana</italic> <bold>(B)</bold>. Length and G + C% distribution of unigenes assembled from high-quality clean reads by the Trinity program (<xref ref-type="bibr" rid="B14">Grabherr et al., 2011</xref>).</p></caption>
<graphic xlink:href="fpls-07-01883-g002.tif"/>
</fig>
</sec>
<sec><title>Functional Annotation and Classification of Unigenes</title>
<p>We performed functional annotation of all unigenes with a BLASTx search (<xref ref-type="bibr" rid="B1">Altschul et al., 1990</xref>) against the NCBI NR database<sup><xref ref-type="fn" rid="fn05">5</xref></sup> (formatted on April 7, 2014); our cutoff <italic>E</italic>-value was &#x003C;1<italic>E</italic>-5. We applied the Blast2GO program v 2.7.1 (<xref ref-type="bibr" rid="B2">Conesa et al., 2005</xref>) to assign GO categories, an EC number, and KEGG pathways (<xref ref-type="bibr" rid="B21">Kanehisa et al., 2014</xref>) based on the BLAST results with default settings. Visualization of the GO functional category of all unigenes and of the distribution of gene functions in the different species was with the BGI WEGO program (<xref ref-type="bibr" rid="B49">Ye et al., 2006</xref>). We identified microsatellites in the unigenes using the microsatellite identification tool (MISA)<sup><xref ref-type="fn" rid="fn06">6</xref></sup> (<xref ref-type="bibr" rid="B42">Thiel et al., 2003</xref>). The default parameters (unit size-minimum repeats: 1-10, 2-6, 3-5, 4-5, 5-5, and 6-5) were used.</p>
</sec>
<sec><title>Authentic Samples and Extraction of Withanolides and LC-QTOF-MS Analysis</title>
<p>The authentic samples of withanolides were isolated from plants as described in our previous paper (<xref ref-type="bibr" rid="B34">Ozawa et al., 2013</xref>). The leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> were collected at five different developmental stages of the growing season before bearing fruit, because our pilot study showed to detect withanolides of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> at these stages (data not shown). Fresh samples of leaves at five different developmental stages were extracted with 5 &#x03BC;l of 80% MeOH containing 2.5 &#x03BC;M lidocaine (internal standard) per mg fresh weight using a mixer mill with zirconia beads (7 min at 18 Hz and 4&#x00B0;C). After 10-min centrifugation, the supernatant was filtered using an HLB &#x03BC;Elution plate (Waters). The extracts (1 &#x03BC;l) were analyzed with LC-QTOF-MS (LC, Waters Acquity UPLC system; MS, Waters Xevo G2 Q-Tof). The analytical conditions for metabolite profiling were as described in elsewhere (<xref ref-type="bibr" rid="B40">Tamura et al., 2014</xref>). The polarity of electrospray ionization was applied in positive ionization mode.</p>
</sec>
</sec>
<sec><title>Results and Discussion</title>
<sec><title>Sample Preparation, Illumina Sequencing, and <italic>De novo</italic> Transcriptome Assembly</title>
<p>For the transcriptome analysis of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>, total RNA samples were isolated from leaves (<bold>Supplementary Image <xref ref-type="supplementary-material" rid="SM1">1</xref></bold>). We performed DNase treatment and confirmed RNA integrity using a bioanalyzer (see Materials and Methods). Total RNA was used in mRNA preparation, fragmentation, and cDNA synthesis. Illumina sequencing produced clean reads (in total 2,540,006,580 bp and 2,345,503,406 bp) from the mRNA pool isolated from <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>, respectively (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>). The short reads exhibited mean quality scores of 35.0 in <italic>P. alkekengi</italic> and 34.9 in <italic>P. peruviana</italic>, confirming that our sequencing was sufficient for <italic>de novo</italic> assembly. After the removal of adaptor-, ambiguous- and low-quality reads, we assembled all clean reads into unigenes using the Trinity program (<xref ref-type="bibr" rid="B14">Grabherr et al., 2011</xref>). There were 75,221 and 54,513 total transcripts in leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>, respectively. The unigenes in <italic>P. alkekengi</italic> had an average length of 867 basepairs (bp) and an N50 of 1,550 bp; in <italic>P. peruviana</italic> the average length was 930 and 1,636 bp (N50). The length and the G + C% distribution for all unigenes in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> are shown in <bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>. In total, 39,709 unigenes were less than 500 bp in length. In <italic>P. alkekengi</italic> 2,732 unigenes were longer than 3,000 bp. In <italic>P. peruviana</italic> 26,991 unigenes were less than 500 bp and 2,283 were longer than 3,000 bp (Supplementary Data Sheet <xref ref-type="supplementary-material" rid="SM3">1</xref>). The average G + C content of unigenes in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> was 39.8 and 40.5%, respectively. The G + C content in <italic>P. peruviana</italic> is consistent with what has been reported previously (<xref ref-type="bibr" rid="B8">Garzon-Martinez et al., 2012</xref>).</p>
</sec>
<sec><title>Functional Annotation of <italic>Physalis</italic> Unigenes</title>
<p>To assess and annotate the assembled unigenes, we performed a sequence homology search against the GenBank non-redundant (NR) database using BLASTx (<italic>E</italic>-value &#x003C; 1<italic>E</italic>-5; <xref ref-type="bibr" rid="B1">Altschul et al., 1990</xref>). We found that 40,090 and 33,183 unigene sequences in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>, respectively, had BLAST hits to annotated sequences in the NR database (<bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>). Further analysis of the similarity distributions showed that 72.5 and 74.7% of matched sequences in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>, respectively, manifested alignment identities greater than 80%. For <italic>P. alkekengi</italic> a large number of the best/top-hits matched the sequences of <italic>S. tuberosum</italic> (61.5%) and <italic>S. lycopersicum</italic> (26.3%); other hits were detected within the reference protein databases of <italic>Vitis vinifera</italic> (1.5%) and <italic>S. demissum</italic> (1.2%; <bold>Figure <xref ref-type="fig" rid="F3">3A</xref></bold>). The <italic>P. peruviana</italic> transcriptome showed that the hits matched the sequences of <italic>S. tuberosum</italic> (61.8%) and <italic>S. lycopersicum</italic> (27.4%); other hits were detected within the reference protein databases of <italic>V. vinifera</italic> (1.2%) and <italic>Nicotiana tabacum</italic> (1.0%; <bold>Figure <xref ref-type="fig" rid="F3">3B</xref></bold>). These observations indicate that the distribution of the top BLAST hits for the obtained unigenes from two different <italic>Physalis</italic> species was similar. Unigenes with no BLAST hits may imply the presence of additional genes that do not exist in the annotated sequence databases or of sequences too short for BLAST hits.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p><bold>Characterization of the assembled unigenes based on a non-redundant (NR) protein database search in <italic>Physalis</italic>. (A)</bold> Top-hit species- and <italic>E</italic>-value-distributions of <italic>P. alkekengi</italic>. The <italic>E</italic>-value distribution of BLAST hits for the assembled unigenes with a cutoff of <italic>E</italic>-value &#x003C; 1<italic>E</italic>-5. <bold>(B)</bold> Top-hit species- and <italic>E</italic>-value-distributions of <italic>P. peruviana</italic>. Top-hit distribution was calculated based on only the best/top sequence alignment with the lowest <italic>E</italic>-value for our BLAST result.</p></caption>
<graphic xlink:href="fpls-07-01883-g003.tif"/>
</fig>
<p>The gene ontology (GO), classification of standardized gene functions, is useful for annotating gene functions and gene products in any organism. GO contains three main independent categories: cellular component, molecular function, and biological process (<xref ref-type="bibr" rid="B41">The Gene Ontology Consortium, 2014</xref>). We used Blast2GO software (<xref ref-type="bibr" rid="B2">Conesa et al., 2005</xref>) to analyze the GO functional categories of the assembled unigenes and then applied WEGO program (<xref ref-type="bibr" rid="B49">Ye et al., 2006</xref>) to visualize the results of GO functional classifications. WEGO maps all annotated unigenes to GO categories and detect the number of unigenes associated with each GO category. Based on NR annotation, 30,689 and 25,751 unigenes in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>, respectively, were assigned to three main categories (<bold>Figure <xref ref-type="fig" rid="F4">4</xref></bold>). Further analysis of the GO categories showed that the dominant categories were &#x201C;cell,&#x201D; &#x201C;cell part,&#x201D; &#x201C;binding,&#x201D; &#x201C;catalytic,&#x201D; &#x201C;metabolic process,&#x201D; and &#x201C;cellular process&#x201D; (black arrows in <bold>Figure <xref ref-type="fig" rid="F4">4</xref></bold>). We observed that within the biological process group, most unigenes were putatively involved in &#x201C;cellular process&#x201D; and &#x201C;metabolic process.&#x201D; Most unigenes were assigned to the GO categories &#x201C;binding&#x201D; and &#x201C;catalytic activity&#x201D; in the molecular function group, and to &#x201C;cells&#x201D; and &#x201C;cell parts&#x201D; in the cellular component. Please note that these observation depends on the layer of the GO categories.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p><bold>GO assignments for all assembled unigenes in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>.</bold> The results are summarized in sets of three functional categories: cellular component, molecular function, and biological process. 30,689 and 25,751 unigenes from <italic>P. alkekengi</italic> (magenta) and <italic>P. peruviana</italic> (cyan), respectively, were categorized by GO categories. The GO categories were displayed using WEGO (<ext-link ext-link-type="uri" xlink:href="http://wego.genomics.org.cn">http://wego.genomics.org.cn</ext-link>; <xref ref-type="bibr" rid="B49">Ye et al., 2006</xref>).</p></caption>
<graphic xlink:href="fpls-07-01883-g004.tif"/>
</fig>
<p>KEGG (<xref ref-type="bibr" rid="B21">Kanehisa et al., 2014</xref>) is a database resource for various levels of molecules in biological systems. It provides useful information for exploring the functional characteristics of genes. To further elucidate the function of the <italic>Physalis</italic> transcriptomes, the unigenes were annotated by the KEGG pathway. A total of 3,819 and 3,669 unigenes in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> was assigned into 134 and 139 KEGG pathways, respectively (<bold>Figure <xref ref-type="fig" rid="F5">5</xref></bold> and Supplementary Data Sheet <xref ref-type="supplementary-material" rid="SM4">2</xref>). The top-five ranking pathways in <italic>P. alkekengi</italic> were purine- (683 unigenes), starch and sucrose- (344 unigenes), thiamine- (258 unigenes), pyrimidine- (244 unigenes), and glycerolipid metabolism (190 unigenes). The top-five ranking pathways in <italic>P. peruviana</italic> were similar to <italic>P. alkekengi</italic> except for glycolysis/gluconeogenesis (178 unigenes in <italic>P. peruviana</italic>; Supplementary Data Sheet <xref ref-type="supplementary-material" rid="SM4">2</xref>). These results agree with a previous study that performed the <italic>P. peruviana</italic> leaf transcriptome (<xref ref-type="bibr" rid="B8">Garzon-Martinez et al., 2012</xref>). In addition, we observed a higher number of the classified unigenes putatively involved in starch and sucrose- and glycolysis metabolism in <italic>P. peruviana</italic> than that of <italic>P. alkekengi</italic>. Such gene diversity derived from genomic architecture may reflect different source-to-sink balance between the both species, causing different photosynthetic rate and the carbon partitioning and allocation [for example, see (<xref ref-type="bibr" rid="B33">Osorio et al., 2014</xref>)]. This analysis implies that the pathway-based approach (see reviews by <xref ref-type="bibr" rid="B37">Ramanan et al., 2012</xref>; <xref ref-type="bibr" rid="B4">Fukushima et al., 2014</xref>) is useful for a better understanding of biological functions, gene interactions, and specific processes in <italic>Physalis</italic> species.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p><bold>Pathway enrichment analysis of assembled unigenes in <italic>Physalis</italic>.</bold> Annotated unigenes were classified into 134 and 139 KEGG pathways in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>, respectively. The top 20 pathways including unigenes in <italic>P. alkekengi</italic> and the corresponding pathways in <italic>P. peruviana</italic> are displayed.</p></caption>
<graphic xlink:href="fpls-07-01883-g005.tif"/>
</fig>
</sec>
<sec><title>Candidate Gene Families Associated with Withanolide Biosynthesis</title>
<p>To visualize diversity in secondary metabolism, we classified unigenes into gene families (Supplementary Data Sheet <xref ref-type="supplementary-material" rid="SM4">2C</xref>). The resultant table shows unigenes encoding enzyme candidates putatively involved in the biosynthesis of secondary metabolites such as alkaloids, terpenoids, steroids, and flavonoids. For terpenoid backbone- and steroid biosynthesis we identified more than one unigene for each step in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>. For example, unigenes encoding enzyme candidates putatively involved in the biosynthesis of 24-methylene cholesterol from isopentenyl pyrophosphate (IPP) and dimethylallyl pyrophosphate (DMAPP) [the synthesis requires 13 reaction steps (<xref ref-type="bibr" rid="B16">Gupta et al., 2013</xref>, <xref ref-type="bibr" rid="B15">2015</xref>)] contained &#x0394;7 desaturase (EC:1.14.21.6), 24-C-methyltrasferase (EC:2.1.1.41), squalene epoxidase (EC: 1.14.13.132&#x2192;1.14.14.17), squalene synthase (EC: 2.5.1.21), cholestenol delta-isomerase (EC: 5.3.3.5), and sterol &#x0394;7-reductase (EC:1.3.1.21). Sterol &#x0394;7-reductase catalyzes the biosynthesis of 24-methylene cholesterol, a central precursor in withanolide biosynthesis (<xref ref-type="bibr" rid="B28">Lockley et al., 1976</xref>). Gupta et al. demonstrated that silencing of sterol &#x0394;7-reductase in <italic>W. somnifera</italic> elicited a reduction in the level of the major withanolide withaferin A in leaves (<xref ref-type="bibr" rid="B15">Gupta et al., 2015</xref>).</p>
<p>The specific withanolide contents in leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> at different stages of the leaf development remain largely unknown. To monitor the variability of the withanolides including physalins and provide insights into the chemical diversity of <italic>Physalis</italic>, we analyzed the metabolite content in leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> at five different developmental stages by liquid chromatography-quadrupole time-of-flight-mass spectrometry (LC-QTOF-MS), focusing on six withanolide metabolites, i.e., physalin B, D, F, withanolide E and F, and perulactone B (<bold>Supplementary Image <xref ref-type="supplementary-material" rid="SM2">2</xref></bold>). We found that <italic>P. alkekengi</italic> produced high levels of physalin B, D, and F. In <italic>P. peruviana</italic> we only detected withanolide E and F, and perulactone B (<bold>Figure <xref ref-type="fig" rid="F6">6</xref></bold>). Low levels of withanolide E, F, and perulactone B in <italic>P. peruviana</italic> were observed at the early developmental stages, while the highest levels of withanolide E and F were detected in the young leaves at day 65 (<italic>t</italic>-test, <italic>p</italic> &#x003C; 0.01). A possible explanation for the difference in metabolite levels could be that there are sequence diversity in candidate genes putatively involved in various secondary transformations, including hydroxylation, glycosylation, methylation, and oxidation/reduction, to produce species-specific and development-specific withanolides from 24-methylene cholesterol as a substrate.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p><bold>Measurement of six withanolides of the leaves from <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>.</bold> Different developmental stages and leaf ages were used for comparison between <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>. The analysis was performed with 3&#x2013;6 biological replicates for each tissue/leaf age. An error bar indicates standard deviation. The authentic compounds used in this analysis were chemically synthesized as described in our previous paper (<xref ref-type="bibr" rid="B34">Ozawa et al., 2013</xref>). The limit of detection of each sample was 0.011923 (<italic>P. alkekengi</italic>, d15_Young), 0.010910 (<italic>P. alkekengi</italic>, d20_Mature), 0.013556 (<italic>P. alkekengi</italic>, d22_Mid), 0.010820 (<italic>P. alkekengi</italic>, d27_Mature), 0.010884 (<italic>P. alkekengi</italic>, d30_Mid), 0.012211 (<italic>P. peruviana</italic>, d15_Mature), 0.012456 (<italic>P. peruviana</italic>, d22_Mature), 0.012366 (<italic>P. peruviana</italic>, d29_Mature), 0.014794 (<italic>P. peruviana</italic>, d65_Young), and 0.013141 (<italic>P. peruviana</italic>, d65_Mature). Asterisks represent statistically significant differences from the sample of the youngest stage (i.e., d29_Mature for perulactone B and d15_Mature for withanolide E and F; <italic>t</italic>-test, <sup>&#x2217;</sup> <italic>p</italic> &#x003C; 0.05 and <sup>&#x2217;&#x2217;</sup> <italic>p</italic> &#x003C; 0.01). Abbreviation: d, day; Mid, middle; and ND, not detected.</p></caption>
<graphic xlink:href="fpls-07-01883-g006.tif"/>
</fig>
<p>To further narrow down the candidate genes responsible for the biosynthesis of withanolides, we sought to identify unigenes that are uniquely expressed in either species. Such unigenes may play important roles in the difference of metabolic phenotypes. To this end we performed reciprocal best-hit BLAST search to identify homologous unigenes in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> with BLASTn (<italic>E</italic>-value &#x003C; 1<italic>E</italic>-14) resulting in 25,670 homologous unigenes. Of these unigenes, we identified unigenes expressed uniquely in either of these species (Supplementary Data Sheet <xref ref-type="supplementary-material" rid="SM5">3</xref>). We uncovered 234 unigenes that are exclusive to <italic>P. alkekengi</italic> (FPKM > 1). Of these, a cytochrome p450 chloroplastic-like protein (unigene-ID: c13295_g2_i2) and oxidoreductase-like protein (c16207_g5_i1), are possible candidate genes for the oxidations at the C-15 and C-18 positions of the steroid backbone required in the synthesis of physalis (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>). In contrast, 355 unigenes found in <italic>P. peruviana</italic> were identified through this approach. There were unigenes encoding sterol reductase (c27112_g1_i1), methyltransferase family proteins, and transcription factors like MYB as candidates of specialized metabolites that are likely produced in <italic>P. peruviana</italic>. We had expected some obvious, differentially expressed candidates from the comparative transcriptomics, as was reported by (<xref ref-type="bibr" rid="B48">Yamazaki et al., 2008</xref>). However, the list of genes expressed exclusively in either <italic>P. alkekengi</italic> or <italic>P. peruviana</italic> provided only few candidates. The transcriptomes of both <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> contain many cytochrome p450 monooxygenases and dioxygenases that could be modify both withanolides and physalins. However, none of these stand out as predominant in either <italic>Physalis</italic> species. We expect the biosynthesis of physalins to include cleavage of the C13-C14 bond as well as crosslinking between C14 and C27. Currently we have no good candidate enzymes for these reactions. Cleavage of the C13-C14 bond may occur through Grob fragmentation by an oxidosqualene cyclase type enzyme as described by <xref ref-type="bibr" rid="B47">Xiong et al. (2006)</xref>.</p>
<p>Although there was no convincing evidence for significant changes in gene expressions encoding any of the key enzymes, we were able to provide a set of the hypothetical candidate genes involved in the pathways. We also recognize the limitation of our metabolite analysis in all its quantitative aspects, and that further assessment of the integration of our transcriptome data with wider metabolite profile is needed, but the findings presented here can provide a relevant resource for future study in <italic>Physalis</italic>. Our transcriptome dataset can be used for the identification of genes that contribute to the diversification in <italic>Physalis</italic> species-specific secondary metabolism, such as glycosyltransferases, methyltransferases, and cytochrome P450s.</p>
</sec>
<sec><title>Identification and Comparison of Single Sequence Repeat (SSR) Markers</title>
<p>Single sequence repeats SSRs are microsatellites, repetitive DNA sequences in eukaryotes. They are useful markers in population genetics research, genetic map construction, and genetic diversity assessment (for example, see reviews <xref ref-type="bibr" rid="B19">Hancock, 1996</xref>; <xref ref-type="bibr" rid="B43">Varshney et al., 2005</xref>). To detect and compare SSRs in the two different <italic>Physalis</italic> species we performed <italic>in silico</italic> SSR marker identification with MISA (<xref ref-type="bibr" rid="B42">Thiel et al., 2003</xref>). We identified 11,415 SSRs in 75,221 transcripts of <italic>P. alkekengi</italic> and 12,180 SSRs in <italic>P. peruviana</italic> (<bold>Table <xref ref-type="table" rid="T2">2</xref></bold> and Supplementary Data Sheet <xref ref-type="supplementary-material" rid="SM6">4</xref>). All SSRs can be classified by their repeat-unit sizes. Mono-nucleotide SSRs represented the largest portion (60.9%) of identified SSRs, followed by tri-nucleotide- (19.8%) and di-nucleotide (18.2%) SSRs. Although only a small portion of tetra- (<italic>n</italic> = 86), penta- (<italic>n</italic> = 14), and hexa-nucleotide SSRs (<italic>n</italic> = 19) were detected in <italic>P. alkekengi</italic> transcripts, it was significant. <italic>P. peruviana</italic> sequences showed nearly the same tendency and had more SSRs than <italic>P. alkekengi</italic>, especially mono- and tri-nucleotide SSRs. There were small numbers of tetra-, penta- and hexa-nucleotide SSRs in our transcriptome sequences from the two species, implying that their base patterns were highly complex. The SSRs of both <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> may yield potential genetic markers for a wide range of investigations including population genetics-, comparative genomic-, and gene-based association studies aimed at elucidating the genetic control of important traits.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Statistics of SSRs detected in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic>.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Summary of microsatellite search</th>
<th valign="top" align="center"><italic>P. alkekengi</italic></th>
<th valign="top" align="center"><italic>P. peruviana</italic></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Total number of identified SSRs</td>
<td valign="top" align="center">11,415</td>
<td valign="top" align="center">12,180</td>
</tr>
<tr>
<td valign="top" align="left">Number of SSR-containing unigenes</td>
<td valign="top" align="center">9,565</td>
<td valign="top" align="center">9,520</td>
</tr>
<tr>
<td valign="top" align="left">Number of unigenes containing more than 1 SSR</td>
<td valign="top" align="center">1,464</td>
<td valign="top" align="center">2,013</td>
</tr>
<tr>
<td valign="top" align="left">Number of SSRs present in compound formation</td>
<td valign="top" align="center">756</td>
<td valign="top" align="center">1,025</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Distribution to different type of repeats</italic></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic># of SSRs (unit size = 1)</italic></td>
<td valign="top" align="center">6,955</td>
<td valign="top" align="center">7,364</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="center">2,078</td>
<td valign="top" align="center">1,980</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="center">2,263</td>
<td valign="top" align="center">2,721</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="center">86</td>
<td valign="top" align="center">83</td></tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">14</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">18</td></tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec><title>Conclusion</title>
<p>We present the comprehensive transcriptome of the leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> and provide a large-scale resource for assembled and functionally annotated gene candidates. Deep transcriptome analysis provided 75,221 unigenes in <italic>P. alkekengi</italic> and 54,513 in <italic>P. peruviana</italic>, respectively. A BLAST search of these sequences identified 40,090 and 33,183 unigenes in <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> as annotated proteins, respectively. We discussed our findings on the gene candidates putatively involved in withanolide biosynthesis and their transcript- and metabolite profiles. Our detection of 11,415 SSRs in <italic>P. alkekengi</italic> and 12,180 SSRs in <italic>P. peruviana</italic> provides a useful resource for population genetics studies, genetic map construction, and genetic diversity assessment in <italic>Physalis</italic>. Because the <italic>Physalis</italic> genus is valuable for producing medicines and functional foods, more genomic data on other members are needed. Our study suggests that comprehensive approaches applied within the family can provide a clue to gene discovery in <italic>Physalis</italic> and yield insights into their complex diversity. Given the insufficient knowledge on the molecular mechanisms controlling the biosynthetic pathways involved in various bioactive metabolites like withanolides, the transcriptome information reported here represents an important public resource for further study on the specialized metabolism of <italic>Physalis</italic> species.</p>
</sec>
<sec><title>Data Accessibility</title>
<p>All raw read sequences in FASTQ format can be downloaded from the DDBJ Sequence Read Archive (<xref ref-type="bibr" rid="B23">Kosuge et al., 2014</xref>) under accession number DRA004085. Our assembled transcripts were deposited as a Transcriptome Shotgun Assembly (TSA) in GenBank/EMBL/DDBJ under the accession IABG01000001-IABG01075221 (75221 entries for <italic>P. alkekengi</italic>) and IABH01000001-IABH01054513 (54513 entries for <italic>P. peruviana</italic>).</p>
</sec>
<sec><title>Author Contributions</title>
<p>Conceived and designed the experiments: AF, HS, MY, MS, and KS. Performed the experiments: MN, HS, MY, TM, MM, GH, and MS. Analyzed the data: AF, EK, NU, TM, and HS. Contributed reagents/materials/analysis tools: MN, HS, MY, TM, MM, GH, and MS. Wrote the paper: AF, EK, and KS. All authors read and approved the final manuscript.</p>
</sec>
<sec><title>Conflict of Interest Statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<ack>
<p>This study was supported, in part, by Studies on enhancement of &#x2019;Comprehensive Medicinal Plant Database&#x2019; aiming for cultivation of medicinal plants and industrial development, a Health and Labour Sciences Research Grant, a Japan Agency for Medical Research and Development Sciences Research Grant, the Japan Advanced Plant Science Research Network, and Strategic Priority Research Promotion Program of Chiba University. Research by EK was financially supported by the Carlsberg Foundation. We thank Dr. Masaaki Ozawa (RIKEN Center for Sustainable Resource Science) for experimental assistance, Ms. Ursula Petralia and Prof. Miyako Kusano (University of Tsukuba) for editorial assistance, and Dr. Tetsuya Sakurai and Mr. Yutaka Yamada (RIKEN Center for Sustainable Resource Science) for computational assistance. We also thank Ms. Sayaka Shinpo (Kazusa DNA Research Institute) for technical support in Illumina sequencing.</p>
</ack>
<sec sec-type="supplementary material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="http://journal.frontiersin.org/article/10.3389/fpls.2016.01883/full#supplementary-material">http://journal.frontiersin.org/article/10.3389/fpls.2016.01883/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image_1.TIF" id="SM1" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>IMAGE 1</label>
<caption><p><bold>Schematic workflow of this study.</bold> We identified 75,221 and 54,513 transcripts in leaves of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> with the Trinity program (<xref ref-type="bibr" rid="B14">Grabherr et al., 2011</xref>). Assembled unigenes were annotated by Blast2GO program (<xref ref-type="bibr" rid="B2">Conesa et al., 2005</xref>).</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_1.TIF" id="SM7" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_2.TIF" id="SM2" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>IMAGE 2</label>
<caption><p><bold>Structures of complex and oxidized steroidal constituents isolated from <italic>Physalis</italic> plants.</bold> We analyzed the metabolite content in leaf tissues of <italic>P. alkekengi</italic> and <italic>P. peruviana</italic> at five different developmental stages by liquid chromatography-quadrupole time-of-flight-mass spectrometry (LC-QTOF-MS), focusing on these six withanolide metabolites.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_2.TIF" id="SM8" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_1.XLSX" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_2.XLSX" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_3.XLSX" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_4.XLSX" id="SM6" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Altschul</surname> <given-names>S. F.</given-names></name> <name><surname>Gish</surname> <given-names>W.</given-names></name> <name><surname>Miller</surname> <given-names>W.</given-names></name> <name><surname>Myers</surname> <given-names>E. W.</given-names></name> <name><surname>Lipman</surname> <given-names>D. J.</given-names></name></person-group> (<year>1990</year>). <article-title>Basic local alignment search tool.</article-title> <source><italic>J. Mol. Biol.</italic></source> <volume>215</volume> <fpage>403</fpage>&#x2013;<lpage>410</lpage>. <pub-id pub-id-type="doi">10.1016/S0022-2836(05)80360-2</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Conesa</surname> <given-names>A.</given-names></name> <name><surname>Gotz</surname> <given-names>S.</given-names></name> <name><surname>Garcia-Gomez</surname> <given-names>J. M.</given-names></name> <name><surname>Terol</surname> <given-names>J.</given-names></name> <name><surname>Talon</surname> <given-names>M.</given-names></name> <name><surname>Robles</surname> <given-names>M.</given-names></name></person-group> (<year>2005</year>). <article-title>Blast2GO: a universal tool for annotation, visualization and analysis in functional genomics research.</article-title> <source><italic>Bioinformatics</italic></source> <volume>21</volume> <fpage>3674</fpage>&#x2013;<lpage>3676</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bti610</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eich</surname> <given-names>E.</given-names></name></person-group> (<year>2008</year>). <source><italic>Terpenoids (Isoprenoids)</italic>.</source> <publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer</publisher-name>.</citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fukushima</surname> <given-names>A.</given-names></name> <name><surname>Kanaya</surname> <given-names>S.</given-names></name> <name><surname>Nishida</surname> <given-names>K.</given-names></name></person-group> (<year>2014</year>). <article-title>Integrated network analysis and effective tools in plant systems biology.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>5</volume>:<issue>598</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2014.00598</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fukushima</surname> <given-names>A.</given-names></name> <name><surname>Kusano</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). <article-title>A network perspective on nitrogen metabolism from model to crop plants using integrated &#x2019;omics&#x2019; approaches.</article-title> <source><italic>J. Exp. Bot.</italic></source> <volume>65</volume> <fpage>5619</fpage>&#x2013;<lpage>5630</lpage>. <pub-id pub-id-type="doi">10.1093/jxb/eru322</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fukushima</surname> <given-names>A.</given-names></name> <name><surname>Nakamura</surname> <given-names>M.</given-names></name> <name><surname>Suzuki</surname> <given-names>H.</given-names></name> <name><surname>Saito</surname> <given-names>K.</given-names></name> <name><surname>Yamazaki</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). <article-title>High-throughput sequencing and de novo assembly of red and green forms of the perilla frutescens var. crispa transcriptome.</article-title> <source><italic>PLoS ONE</italic></source> <volume>10</volume>:<issue>e0129154</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0129154</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garber</surname> <given-names>M.</given-names></name> <name><surname>Grabherr</surname> <given-names>M. G.</given-names></name> <name><surname>Guttman</surname> <given-names>M.</given-names></name> <name><surname>Trapnell</surname> <given-names>C.</given-names></name></person-group> (<year>2011</year>). <article-title>Computational methods for transcriptome annotation and quantification using RNA-seq.</article-title> <source><italic>Nat. Methods</italic></source> <volume>8</volume> <fpage>469</fpage>&#x2013;<lpage>477</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.1613</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garzon-Martinez</surname> <given-names>G. A.</given-names></name> <name><surname>Zhu</surname> <given-names>Z. I.</given-names></name> <name><surname>Landsman</surname> <given-names>D.</given-names></name> <name><surname>Barrero</surname> <given-names>L. S.</given-names></name> <name><surname>Marino-Ramirez</surname> <given-names>L.</given-names></name></person-group> (<year>2012</year>). <article-title>The <italic>Physalis peruviana</italic> leaf transcriptome: assembly, annotation and gene model prediction.</article-title> <source><italic>BMC Genomics</italic></source> <volume>13</volume>:<issue>151</issue>. <pub-id pub-id-type="doi">10.1186/1471-2164-13-151</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gongora-Castillo</surname> <given-names>E.</given-names></name> <name><surname>Buell</surname> <given-names>C. R.</given-names></name></person-group> (<year>2013</year>). <article-title>Bioinformatics challenges in de novo transcriptome assembly using short read sequences in the absence of a reference genome sequence.</article-title> <source><italic>Nat. Prod. Rep.</italic></source> <volume>30</volume> <fpage>490</fpage>&#x2013;<lpage>500</lpage>. <pub-id pub-id-type="doi">10.1039/c3np20099j</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gongora-Castillo</surname> <given-names>E.</given-names></name> <name><surname>Childs</surname> <given-names>K. L.</given-names></name> <name><surname>Fedewa</surname> <given-names>G.</given-names></name> <name><surname>Hamilton</surname> <given-names>J. P.</given-names></name> <name><surname>Liscombe</surname> <given-names>D. K.</given-names></name> <name><surname>Magallanes-Lundback</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2012a</year>). <article-title>Development of transcriptomic resources for interrogating the biosynthesis of monoterpene indole alkaloids in medicinal plant species.</article-title> <source><italic>PLoS ONE</italic></source> <volume>7</volume>:<issue>e52506</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0052506</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gongora-Castillo</surname> <given-names>E.</given-names></name> <name><surname>Fedewa</surname> <given-names>G.</given-names></name> <name><surname>Yeo</surname> <given-names>Y.</given-names></name> <name><surname>Chappell</surname> <given-names>J.</given-names></name> <name><surname>Dellapenna</surname> <given-names>D.</given-names></name> <name><surname>Buell</surname> <given-names>C. R.</given-names></name></person-group> (<year>2012b</year>). <article-title>Genomic approaches for interrogating the biochemistry of medicinal plant species.</article-title> <source><italic>Methods Enzymol.</italic></source> <volume>517</volume> <fpage>139</fpage>&#x2013;<lpage>159</lpage>. <pub-id pub-id-type="doi">10.1016/B978-0-12-404634-4.00007-3</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gordo</surname> <given-names>S. M.</given-names></name> <name><surname>Pinheiro</surname> <given-names>D. G.</given-names></name> <name><surname>Moreira</surname> <given-names>E. C.</given-names></name> <name><surname>Rodrigues</surname> <given-names>S. M.</given-names></name> <name><surname>Poltronieri</surname> <given-names>M. C.</given-names></name> <name><surname>De Lemos</surname> <given-names>O. F.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>High-throughput sequencing of black pepper root transcriptome.</article-title> <source><italic>BMC Plant Biol.</italic></source> <volume>12</volume>:<issue>168</issue>. <pub-id pub-id-type="doi">10.1186/1471-2229-12-168</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Goto</surname> <given-names>N.</given-names></name> <name><surname>Prins</surname> <given-names>P.</given-names></name> <name><surname>Nakao</surname> <given-names>M.</given-names></name> <name><surname>Bonnal</surname> <given-names>R.</given-names></name> <name><surname>Aerts</surname> <given-names>J.</given-names></name> <name><surname>Katayama</surname> <given-names>T.</given-names></name></person-group> (<year>2010</year>). <article-title>BioRuby: bioinformatics software for the Ruby programming language.</article-title> <source><italic>Bioinformatics</italic></source> <volume>26</volume> <fpage>2617</fpage>&#x2013;<lpage>2619</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btq475</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grabherr</surname> <given-names>M. G.</given-names></name> <name><surname>Haas</surname> <given-names>B. J.</given-names></name> <name><surname>Yassour</surname> <given-names>M.</given-names></name> <name><surname>Levin</surname> <given-names>J. Z.</given-names></name> <name><surname>Thompson</surname> <given-names>D. A.</given-names></name> <name><surname>Amit</surname> <given-names>I.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Full-length transcriptome assembly from RNA-Seq data without a reference genome.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>29</volume> <fpage>644</fpage>&#x2013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gupta</surname> <given-names>P.</given-names></name> <name><surname>Goel</surname> <given-names>R.</given-names></name> <name><surname>Agarwal</surname> <given-names>A. V.</given-names></name> <name><surname>Asif</surname> <given-names>M. H.</given-names></name> <name><surname>Sangwan</surname> <given-names>N. S.</given-names></name> <name><surname>Sangwan</surname> <given-names>R. S.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Comparative transcriptome analysis of different chemotypes elucidates withanolide biosynthesis pathway from medicinal plant <italic>Withania somnifera</italic>.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>5</volume>:<issue>18611</issue>. <pub-id pub-id-type="doi">10.1038/srep18611</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gupta</surname> <given-names>P.</given-names></name> <name><surname>Goel</surname> <given-names>R.</given-names></name> <name><surname>Pathak</surname> <given-names>S.</given-names></name> <name><surname>Srivastava</surname> <given-names>A.</given-names></name> <name><surname>Singh</surname> <given-names>S. P.</given-names></name> <name><surname>Sangwan</surname> <given-names>R. S.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>De novo assembly, functional annotation and comparative analysis of <italic>Withania somnifera</italic> leaf and root transcriptomes to identify putative genes involved in the withanolides biosynthesis.</article-title> <source><italic>PLoS ONE</italic></source> <volume>8</volume>:<issue>e62714</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0062714</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Han</surname> <given-names>R.</given-names></name> <name><surname>Takahashi</surname> <given-names>H.</given-names></name> <name><surname>Nakamura</surname> <given-names>M.</given-names></name> <name><surname>Bunsupa</surname> <given-names>S.</given-names></name> <name><surname>Yoshimoto</surname> <given-names>N.</given-names></name> <name><surname>Yamamoto</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2015a</year>). <article-title>Transcriptome analysis of nine tissues to discover genes involved in the biosynthesis of active ingredients in sophora flavescens.</article-title> <source><italic>Biol. Pharm. Bull.</italic></source> <volume>38</volume> <fpage>876</fpage>&#x2013;<lpage>883</lpage>. <pub-id pub-id-type="doi">10.1248/bpb.b14-00834</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Han</surname> <given-names>R.</given-names></name> <name><surname>Takahashi</surname> <given-names>H.</given-names></name> <name><surname>Nakamura</surname> <given-names>M.</given-names></name> <name><surname>Yoshimoto</surname> <given-names>N.</given-names></name> <name><surname>Suzuki</surname> <given-names>H.</given-names></name> <name><surname>Shibata</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2015b</year>). <article-title>Transcriptomic landscape of <italic>Pueraria lobata</italic> demonstrates potential for phytochemical study.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>6</volume>:<issue>426</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2015.00426</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hancock</surname> <given-names>J. M.</given-names></name></person-group> (<year>1996</year>). <article-title>Simple sequences in a &#x201D;minimal&#x2019; genome.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>14</volume> <fpage>14</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1038/ng0996-14</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jacobo-Herrera</surname> <given-names>N. J.</given-names></name> <name><surname>Bremner</surname> <given-names>P.</given-names></name> <name><surname>Marquez</surname> <given-names>N.</given-names></name> <name><surname>Gupta</surname> <given-names>M. P.</given-names></name> <name><surname>Gibbons</surname> <given-names>S.</given-names></name> <name><surname>Munoz</surname> <given-names>E.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>Physalins from <italic>Witheringia solanacea</italic> as modulators of the NF-kappaB cascade.</article-title> <source><italic>J. Nat. Prod.</italic></source> <volume>69</volume> <fpage>328</fpage>&#x2013;<lpage>331</lpage>. <pub-id pub-id-type="doi">10.1021/np050225t</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kanehisa</surname> <given-names>M.</given-names></name> <name><surname>Goto</surname> <given-names>S.</given-names></name> <name><surname>Sato</surname> <given-names>Y.</given-names></name> <name><surname>Kawashima</surname> <given-names>M.</given-names></name> <name><surname>Furumichi</surname> <given-names>M.</given-names></name> <name><surname>Tanabe</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). <article-title>Data, information, knowledge and principle: back to metabolism in KEGG.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>42</volume> <fpage>D199</fpage>&#x2013;<lpage>D205</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt1076</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kawai</surname> <given-names>M.</given-names></name> <name><surname>Makino</surname> <given-names>B.</given-names></name> <name><surname>Yamamura</surname> <given-names>H.</given-names></name> <name><surname>Araki</surname> <given-names>S.</given-names></name> <name><surname>Butsugan</surname> <given-names>Y.</given-names></name> <name><surname>Ohya</surname> <given-names>J.</given-names></name></person-group> (<year>2002</year>). <article-title>Cytotoxic activity of physalins and related compounds against HeLa cells.</article-title> <source><italic>Pharmazie</italic></source> <volume>57</volume> <fpage>348</fpage>&#x2013;<lpage>350</lpage>.</citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kosuge</surname> <given-names>T.</given-names></name> <name><surname>Mashima</surname> <given-names>J.</given-names></name> <name><surname>Kodama</surname> <given-names>Y.</given-names></name> <name><surname>Fujisawa</surname> <given-names>T.</given-names></name> <name><surname>Kaminuma</surname> <given-names>E.</given-names></name> <name><surname>Ogasawara</surname> <given-names>O.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>DDBJ progress report: a new submission system for leading to a correct annotation.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>42</volume> <fpage>D44</fpage>&#x2013;<lpage>D49</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt1066</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Langmead</surname> <given-names>B.</given-names></name> <name><surname>Trapnell</surname> <given-names>C.</given-names></name> <name><surname>Pop</surname> <given-names>M.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2009</year>). <article-title>Ultrafast and memory-efficient alignment of short DNA sequences to the human genome.</article-title> <source><italic>Genome Biol.</italic></source> <volume>10</volume>:<issue>R25</issue>. <pub-id pub-id-type="doi">10.1186/gb-2009-10-3-r25</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lei</surname> <given-names>B.</given-names></name> <name><surname>Lu</surname> <given-names>K.</given-names></name> <name><surname>Ding</surname> <given-names>F.</given-names></name> <name><surname>Zhang</surname> <given-names>K.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Zhao</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>RNA sequencing analysis reveals transcriptomic variations in tobacco (<italic>Nicotiana tabacum</italic>) leaves affected by climate, soil, and tillage factors.</article-title> <source><italic>Int. J. Mol. Sci.</italic></source> <volume>15</volume> <fpage>6137</fpage>&#x2013;<lpage>6160</lpage>. <pub-id pub-id-type="doi">10.3390/ijms15046137</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>B.</given-names></name> <name><surname>Dewey</surname> <given-names>C. N.</given-names></name></person-group> (<year>2011</year>). <article-title>RSEM: accurate transcript quantification from RNA-Seq data with or without a reference genome.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>12</volume>:<issue>323</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-12-323</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Zhao</surname> <given-names>J.</given-names></name> <name><surname>Yang</surname> <given-names>M.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Physalins and withanolides from the fruits of <italic>Physalis alkekengi</italic> L. var. franchetii (Mast.) Makino and the inhibitory activities against human tumor cells.</article-title> <source><italic>Phytochem. Lett.</italic></source> <volume>10</volume> <fpage>95</fpage>&#x2013;<lpage>100</lpage>. <pub-id pub-id-type="doi">10.1016/j.phytol.2014.08.004</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lockley</surname> <given-names>W. J. S.</given-names></name> <name><surname>Rees</surname> <given-names>H. H.</given-names></name> <name><surname>Goodwin</surname> <given-names>T. W.</given-names></name></person-group> (<year>1976</year>). <article-title>Biosynthesis of steroidal withanolides in <italic>Withania somnifera</italic>.</article-title> <source><italic>Phytochemistry</italic></source> <volume>15</volume> <fpage>937</fpage>&#x2013;<lpage>939</lpage>. <pub-id pub-id-type="doi">10.1016/S0031-9422(00)84374-5</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martinez</surname> <given-names>M.</given-names></name></person-group> (<year>1998</year>). <article-title>Revision of <italic>Physalis</italic> section epiteiorhiza (Solanaceae).</article-title> <source><italic>Anal. Inst. Biol. Serie Bot.</italic></source> <volume>69</volume> <fpage>71</fpage>&#x2013;<lpage>117</lpage>.</citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Matsuura</surname> <given-names>T.</given-names></name> <name><surname>Kawai</surname> <given-names>M.</given-names></name></person-group> (<year>1969</year>). <article-title>Bitter principles of physalis alkekengi var francheti: structure of physalin B.</article-title> <source><italic>Tetrahedron Lett.</italic></source> <volume>10</volume> <fpage>1765</fpage>&#x2013;<lpage>1766</lpage>. <pub-id pub-id-type="doi">10.1016/S0040-4039(01)88006-0</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Matsuura</surname> <given-names>T.</given-names></name> <name><surname>Kawai</surname> <given-names>M.</given-names></name> <name><surname>Nakashima</surname> <given-names>R.</given-names></name> <name><surname>Butsugan</surname> <given-names>Y.</given-names></name></person-group> (<year>1969</year>). <article-title>Bitter principles of <italic>Physalis alkekengi</italic> var francheti: structure of physalin a.</article-title> <source><italic>Tetrahedron Lett.</italic></source> <volume>10</volume> <fpage>1083</fpage>&#x2013;<lpage>1086</lpage>. <pub-id pub-id-type="doi">10.1016/S0040-4039(01)88006-0</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morgan</surname> <given-names>M.</given-names></name> <name><surname>Anders</surname> <given-names>S.</given-names></name> <name><surname>Lawrence</surname> <given-names>M.</given-names></name> <name><surname>Aboyoun</surname> <given-names>P.</given-names></name> <name><surname>Pages</surname> <given-names>H.</given-names></name> <name><surname>Gentleman</surname> <given-names>R.</given-names></name></person-group> (<year>2009</year>). <article-title>ShortRead: a bioconductor package for input, quality assessment and exploration of high-throughput sequence data.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>2607</fpage>&#x2013;<lpage>2608</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp450</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Osorio</surname> <given-names>S.</given-names></name> <name><surname>Ruan</surname> <given-names>Y. L.</given-names></name> <name><surname>Fernie</surname> <given-names>A. R.</given-names></name></person-group> (<year>2014</year>). <article-title>An update on source-to-sink carbon partitioning in tomato.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>5</volume>:<issue>516</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2014.00516</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ozawa</surname> <given-names>M.</given-names></name> <name><surname>Morita</surname> <given-names>M.</given-names></name> <name><surname>Hirai</surname> <given-names>G.</given-names></name> <name><surname>Tamura</surname> <given-names>S.</given-names></name> <name><surname>Kawai</surname> <given-names>M.</given-names></name> <name><surname>Tsuchiya</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Contribution of cage-shaped structure of physalins to their mode of action in inhibition of NF-kappaB activation.</article-title> <source><italic>ACS Med. Chem. Lett.</italic></source> <volume>4</volume> <fpage>730</fpage>&#x2013;<lpage>735</lpage>. <pub-id pub-id-type="doi">10.1021/ml400144e</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pages</surname> <given-names>H.</given-names></name> <name><surname>Aboyoun</surname> <given-names>P.</given-names></name> <name><surname>Gentleman</surname> <given-names>R.</given-names></name> <name><surname>Debroy</surname> <given-names>S.</given-names></name></person-group> (<year>2009</year>). <source><italic>Biostrings: String Objects Representing Biological Sequences, and Matching Algorithms. R Package Version 2.32.1</italic>.</source> Available at: <ext-link ext-link-type="uri" xlink:href="http://bioconductor.org/packages/Biostrings/">http://bioconductor.org/packages/Biostrings/</ext-link></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ramadan</surname> <given-names>M. F.</given-names></name> <name><surname>Morsel</surname> <given-names>J. T.</given-names></name></person-group> (<year>2003</year>). <article-title>Oil goldenberry (<italic>Physalis peruviana</italic> L.).</article-title> <source><italic>J. Agric. Food Chem.</italic></source> <volume>51</volume> <fpage>969</fpage>&#x2013;<lpage>974</lpage>. <pub-id pub-id-type="doi">10.1021/jf020778z</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ramanan</surname> <given-names>V. K.</given-names></name> <name><surname>Shen</surname> <given-names>L.</given-names></name> <name><surname>Moore</surname> <given-names>J. H.</given-names></name> <name><surname>Saykin</surname> <given-names>A. J.</given-names></name></person-group> (<year>2012</year>). <article-title>Pathway analysis of genomic data: concepts, methods, and prospects for future development.</article-title> <source><italic>Trends Genet.</italic></source> <volume>28</volume> <fpage>323</fpage>&#x2013;<lpage>332</lpage>. <pub-id pub-id-type="doi">10.1016/j.tig.2012.03.004</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ramesh</surname> <given-names>K. R.</given-names></name> <name><surname>Hemalatha</surname> <given-names>R.</given-names></name> <name><surname>Vijayendra</surname> <given-names>C. A.</given-names></name> <name><surname>Arshi</surname> <given-names>U. Z.</given-names></name> <name><surname>Dushyant</surname> <given-names>S. B.</given-names></name> <name><surname>Dinesh</surname> <given-names>K. B.</given-names></name></person-group> (<year>2016</year>). <article-title>Transcriptome analysis of <italic>Solanum melongena</italic> L. (eggplant) fruit to identify putative allergens and their epitopes.</article-title> <source><italic>Gene</italic></source> <volume>576</volume> <fpage>64</fpage>&#x2013;<lpage>71</lpage>. <pub-id pub-id-type="doi">10.1016/j.gene.2015.09.064</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Senthil</surname> <given-names>K.</given-names></name> <name><surname>Jayakodi</surname> <given-names>M.</given-names></name> <name><surname>Thirugnanasambantham</surname> <given-names>P.</given-names></name> <name><surname>Lee</surname> <given-names>S. C.</given-names></name> <name><surname>Duraisamy</surname> <given-names>P.</given-names></name> <name><surname>Purushotham</surname> <given-names>P. M.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Transcriptome analysis reveals in vitro cultured <italic>Withania somnifera</italic> leaf and root tissues as a promising source for targeted withanolide biosynthesis.</article-title> <source><italic>BMC Genomics</italic></source> <volume>16</volume>:<issue>14</issue>. <pub-id pub-id-type="doi">10.1186/s12864-015-1214-0</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tamura</surname> <given-names>M.</given-names></name> <name><surname>Tsuji</surname> <given-names>Y.</given-names></name> <name><surname>Kusunose</surname> <given-names>T.</given-names></name> <name><surname>Okazawa</surname> <given-names>A.</given-names></name> <name><surname>Kamimura</surname> <given-names>N.</given-names></name> <name><surname>Mori</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Successful expression of a novel bacterial gene for pinoresinol reductase and its effect on lignan biosynthesis in transgenic <italic>Arabidopsis thaliana</italic>.</article-title> <source><italic>Appl. Microbiol. Biotechnol.</italic></source> <volume>98</volume> <fpage>8165</fpage>&#x2013;<lpage>8177</lpage>. <pub-id pub-id-type="doi">10.1007/s00253-014-5934-x</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><collab>The Gene Ontology Consortium</collab> (<year>2014</year>). <article-title>Gene ontology consortium: going forward.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>D1049</fpage>&#x2013;<lpage>D1056</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gku1179</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thiel</surname> <given-names>T.</given-names></name> <name><surname>Michalek</surname> <given-names>W.</given-names></name> <name><surname>Varshney</surname> <given-names>R. K.</given-names></name> <name><surname>Graner</surname> <given-names>A.</given-names></name></person-group> (<year>2003</year>). <article-title>Exploiting EST databases for the development and characterization of gene-derived SSR-markers in barley (<italic>Hordeum vulgare</italic> L.).</article-title> <source><italic>Theor. Appl. Genet.</italic></source> <volume>106</volume> <fpage>411</fpage>&#x2013;<lpage>422</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-002-1031-0</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Varshney</surname> <given-names>R. K.</given-names></name> <name><surname>Graner</surname> <given-names>A.</given-names></name> <name><surname>Sorrells</surname> <given-names>M. E.</given-names></name></person-group> (<year>2005</year>). <article-title>Genic microsatellite markers in plants: features and applications.</article-title> <source><italic>Trends Biotechnol.</italic></source> <volume>23</volume> <fpage>48</fpage>&#x2013;<lpage>55</lpage>. <pub-id pub-id-type="doi">10.1016/j.tibtech.2004.11.005</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Gerstein</surname> <given-names>M.</given-names></name> <name><surname>Snyder</surname> <given-names>M.</given-names></name></person-group> (<year>2009</year>). <article-title>RNA-Seq: a revolutionary tool for transcriptomics.</article-title> <source><italic>Nat. Rev. Genet.</italic></source> <volume>10</volume> <fpage>57</fpage>&#x2013;<lpage>63</lpage>. <pub-id pub-id-type="doi">10.1038/nrg2484</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weber</surname> <given-names>A. P.</given-names></name></person-group> (<year>2015</year>). <article-title>Discovering new biology through sequencing of RNA.</article-title> <source><italic>Plant Physiol.</italic></source> <volume>169</volume> <fpage>1524</fpage>&#x2013;<lpage>1531</lpage>. <pub-id pub-id-type="doi">10.1104/pp.15.01081</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>S. Y.</given-names></name> <name><surname>Leu</surname> <given-names>Y. L.</given-names></name> <name><surname>Chang</surname> <given-names>Y. L.</given-names></name> <name><surname>Wu</surname> <given-names>T. S.</given-names></name> <name><surname>Kuo</surname> <given-names>P. C.</given-names></name> <name><surname>Liao</surname> <given-names>Y. R.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Physalin F induces cell apoptosis in human renal carcinoma cells by targeting NF-kappaB and generating reactive oxygen species.</article-title> <source><italic>PLoS ONE</italic></source> <volume>7</volume>:<issue>e40727</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0040727</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xiong</surname> <given-names>Q.</given-names></name> <name><surname>Wilson</surname> <given-names>W. K.</given-names></name> <name><surname>Matsuda</surname> <given-names>S. P.</given-names></name></person-group> (<year>2006</year>). <article-title>An <italic>Arabidopsis</italic> oxidosqualene cyclase catalyzes iridal skeleton formation by grob fragmentation.</article-title> <source><italic>Angew. Chem. Int. Ed. Engl</italic></source> <volume>45</volume> <fpage>1285</fpage>&#x2013;<lpage>1288</lpage>. <pub-id pub-id-type="doi">10.1002/anie.200503420</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yamazaki</surname> <given-names>M.</given-names></name> <name><surname>Shibata</surname> <given-names>M.</given-names></name> <name><surname>Nishiyama</surname> <given-names>Y.</given-names></name> <name><surname>Springob</surname> <given-names>K.</given-names></name> <name><surname>Kitayama</surname> <given-names>M.</given-names></name> <name><surname>Shimada</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Differential gene expression profiles of red and green forms of <italic>Perilla frutescens</italic> leading to comprehensive identification of anthocyanin biosynthetic genes.</article-title> <source><italic>FEBS J.</italic></source> <volume>275</volume> <fpage>3494</fpage>&#x2013;<lpage>3502</lpage>. <pub-id pub-id-type="doi">10.1111/j.1742-4658.2008.06496.x</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ye</surname> <given-names>J.</given-names></name> <name><surname>Fang</surname> <given-names>L.</given-names></name> <name><surname>Zheng</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>WEGO: a web tool for plotting GO annotations.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>34</volume> <fpage>W293</fpage>&#x2013;<lpage>W297</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkl031</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yen</surname> <given-names>C. Y.</given-names></name> <name><surname>Chiu</surname> <given-names>C. C.</given-names></name> <name><surname>Chang</surname> <given-names>F. R.</given-names></name> <name><surname>Chen</surname> <given-names>J. Y.</given-names></name> <name><surname>Hwang</surname> <given-names>C. C.</given-names></name> <name><surname>Hseu</surname> <given-names>Y. C.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>4beta-Hydroxywithanolide E from <italic>Physalis peruviana</italic> (golden berry) inhibits growth of human lung cancer cells through DNA damage, apoptosis and G2/M arrest.</article-title> <source><italic>BMC Cancer</italic></source> <volume>10</volume>:<issue>46</issue>. <pub-id pub-id-type="doi">10.1186/1471-2407-10-46</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yeo</surname> <given-names>Y. S.</given-names></name> <name><surname>Nybo</surname> <given-names>S. E.</given-names></name> <name><surname>Chittiboyina</surname> <given-names>A. G.</given-names></name> <name><surname>Weerasooriya</surname> <given-names>A. D.</given-names></name> <name><surname>Wang</surname> <given-names>Y. H.</given-names></name> <name><surname>Gongora-Castillo</surname> <given-names>E.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Functional identification of valerena-1,10-diene synthase, a terpene synthase catalyzing a unique chemical cascade in the biosynthesis of biologically active sesquiterpenes in <italic>Valeriana officinalis</italic>.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>288</volume> <fpage>3163</fpage>&#x2013;<lpage>3173</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M112.415836</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="fn01"><label>1</label><p><ext-link ext-link-type="uri" xlink:href="http://medicinalplantgenomics.msu.edu/">http://medicinalplantgenomics.msu.edu/</ext-link></p></fn>
<fn id="fn02"><label>2</label><p><ext-link ext-link-type="uri" xlink:href="http://medplants.ncgr.org/">http://medplants.ncgr.org/</ext-link></p></fn>
<fn id="fn03"><label>3</label><p><ext-link ext-link-type="uri" xlink:href="http://hannonlab.cshl.edu/fastx_toolkit/">http://hannonlab.cshl.edu/fastx_toolkit/</ext-link></p></fn>
<fn id="fn04"><label>4</label><p><ext-link ext-link-type="uri" xlink:href="http://www.bioinformatics.babraham.ac.uk/projects/fastqc/">http://www.bioinformatics.babraham.ac.uk/projects/fastqc/</ext-link></p></fn>
<fn id="fn05"><label>5</label><p><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov">http://www.ncbi.nlm.nih.gov</ext-link></p></fn>
<fn id="fn06"><label>6</label><p><ext-link ext-link-type="uri" xlink:href="http://pgrc.ipk-gatersleben.de/misa/">http://pgrc.ipk-gatersleben.de/misa/</ext-link></p></fn>
</fn-group>
</back>
</article>