<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">635074</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2021.635074</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Decoding Neuromuscular Disorders Using Phenotypic Clusters Obtained From Co-Occurrence Networks</article-title>
<alt-title alt-title-type="left-running-head">D&#xed;az-Santiago et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Co-Occurrence Clusters in Neuromuscular Disorders</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>D&#xed;az-Santiago</surname>
<given-names>Elena</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1198199/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Claros</surname>
<given-names>M. Gonzalo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/231057/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yahyaoui</surname>
<given-names>Raquel</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>de Diego-Otero</surname>
<given-names>Yolanda</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1234331/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Calvo</surname>
<given-names>Roc&#xed;o</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hoenicka</surname>
<given-names>Janet</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/194295/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Palau</surname>
<given-names>Francesc</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1156143/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ranea</surname>
<given-names>Juan A. G.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1196994/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Perkins</surname>
<given-names>James R.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Department of Molecular Biology and Biochemistry, Universidad de M&#xe1;laga, <addr-line>M&#xe1;laga</addr-line>, <country>Spain</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>CIBER de Enfermedades Raras (CIBERER), <addr-line>Madrid</addr-line>, <country>Spain</country>
</aff>
<aff id="aff3">
<label>
<sup>3</sup>
</label>Institute of Biomedical Research in Malaga (IBIMA), IBIMA-RARE, <addr-line>M&#xe1;laga</addr-line>, <country>Spain</country>
</aff>
<aff id="aff4">
<label>
<sup>4</sup>
</label>Institute for Mediterranean and Subtropical Horticulture &#x201c;La Mayora&#x201d; (IHSM-UMA-CSIC), <addr-line>M&#xe1;laga</addr-line>, <country>Spain</country>
</aff>
<aff id="aff5">
<label>
<sup>5</sup>
</label>Laboratory of Metabolopathies and Neonatal Screening, M&#xe1;laga Regional University Hospital, <addr-line>M&#xe1;laga</addr-line>, <country>Spain</country>
</aff>
<aff id="aff6">
<label>
<sup>6</sup>
</label>Sant Joan de D&#xe9;u Hospital and Research Institute, <addr-line>Barcelona</addr-line>, <country>Spain</country>
</aff>
<aff id="aff7">
<label>
<sup>7</sup>
</label>Hospital Cl&#xed;nic and University of Barcelona School of Medicine and Health Sciences, <addr-line>Barcelona</addr-line>, <country>Spain</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/269299/overview">Silvia Bottini</ext-link>, Universit&#xe9; C&#xf4;te d&#x27;Azur, France</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/552766/overview">Tao Huang</ext-link>, Shanghai Institute of Nutrition and Health (CAS), China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/181238/overview">Filippo M. Santorelli</ext-link>, Fondazione Stella Maris (IRCCS), Italy</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/326927/overview">Yu-Hang Zhang</ext-link>, Brigham and Women&#x2019;s Hospital, United&#x20;States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: M. Gonzalo Claros, <email>claros@uma.es</email>
</corresp>
<fn fn-type="equal" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors have contributed equally to this&#x20;work</p>
</fn>
<fn fn-type="other">
<p>This article was submitted to Biological Modeling and Simulation, a section of the journal Frontiers in Molecular Biosciences</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>04</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>8</volume>
<elocation-id>635074</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>11</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>02</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 D&#xed;az-Santiago, Claros, Yahyaoui, de Diego-Otero, Calvo, Hoenicka, Palau, Ranea and Perkins.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>D&#xed;az-Santiago, Claros, Yahyaoui, de Diego-Otero, Calvo, Hoenicka, Palau, Ranea and Perkins</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>Neuromuscular disorders (NMDs) represent an important subset of rare diseases associated with elevated morbidity and mortality whose diagnosis can take years. Here we present a novel approach using systems biology to produce functionally-coherent phenotype clusters that provide insight into the cellular functions and phenotypic patterns underlying NMDs, using the Human Phenotype Ontology as a common framework. Gene and phenotype information was obtained for 424 NMDs in OMIM and 126 NMDs in Orphanet, and 335 and 216 phenotypes were identified as typical for NMDs, respectively. &#x2018;Elevated serum creatine kinase&#x2019; was the most specific to NMDs, in agreement with the clinical test of elevated serum creatinine kinase that is conducted on NMD patients. The approach to obtain co-occurring NMD phenotypes was validated based on co-mention in PubMed abstracts. A total of 231 (OMIM) and 150 (Orphanet) clusters of highly connected co-occurrent NMD phenotypes were obtained. In parallel, a tripartite network based on phenotypes, diseases and genes was used to associate NMD phenotypes with functions, an approach also validated by literature co-mention, with KEGG pathways showing proportionally higher overlap than Gene Ontology and Reactome. Phenotype-function pairs were crossed with the co-occurrent NMD phenotype clusters to obtain 40 (OMIM) and 72 (Orphanet) functionally coherent phenotype clusters. As expected, many of these overlapped with known diseases and confirmed existing knowledge. Other clusters revealed interesting new findings, indicating informative phenotypes for differential diagnosis, providing deeper knowledge of NMDs, and pointing towards specific cell dysfunction caused by pleiotropic genes. This work is an example of reproducible research that i) can help better understand NMDs and support their diagnosis by providing a new tool that exploits existing information to obtain novel clusters of functionally-related phenotypes, and ii) takes us another step towards personalised medicine for&#x20;NMDs.</p>
</abstract>
<kwd-group>
<kwd>neuromuscular disorders</kwd>
<kwd>rare disease</kwd>
<kwd>phenotype</kwd>
<kwd>network analysis</kwd>
<kwd>cluster</kwd>
<kwd>co-occurrence analysis</kwd>
</kwd-group>
<contract-num rid="cn001">UMA18-FEDERJA- 102</contract-num>
<contract-num rid="cn002">PID2019-108096RB-C21 PID2019- 108096RB-C22 UMA18-FEDERJA-102 TIN2017-88728-C2-1-R</contract-num>
<contract-num rid="cn003">PID2019-108096RB-C21 PID2019-108096RB-C22 TIN2017-88728-C2-1-R</contract-num>
<contract-num rid="cn004">PI-0075- 2017</contract-num>
<contract-num rid="cn005">RD-XIX-ed</contract-num>
<contract-num rid="cn006">I Plan Propio</contract-num>
<contract-sponsor id="cn001">Consejer&#xed;a de Conocimiento, Investigaci&#xf3;n y Universidad, Junta de Andaluc&#xed;a<named-content content-type="fundref-id">10.13039/501100018943</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">European Regional Development Fund<named-content content-type="fundref-id">10.13039/501100008530</named-content>
</contract-sponsor>
<contract-sponsor id="cn003">Ministerio de Ciencia e Innovaci&#xf3;n<named-content content-type="fundref-id">10.13039/501100004837</named-content>
</contract-sponsor>
<contract-sponsor id="cn004">Fundaci&#xf3;n P&#xfa;blica Andaluza Progreso y Salud<named-content content-type="fundref-id">10.13039/501100015757</named-content>
</contract-sponsor>
<contract-sponsor id="cn005">Fundaci&#xf3;n Ram&#xf3;n Areces<named-content content-type="fundref-id">10.13039/100008054</named-content>
</contract-sponsor>
<contract-sponsor id="cn006">Universidad de M&#xe1;laga<named-content content-type="fundref-id">10.13039/100009473</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Neuromuscular disorders (NMDs) encompass a range of pathologies affecting muscle function (<xref ref-type="bibr" rid="B57">Roy et&#x20;al., 2015</xref>) that can be caused by problems in spinal motor neurones, peripheral nerves, muscles, and neuromuscular junctions. They affect 6&#x2013;8&#xa0;million people worldwide (<xref ref-type="bibr" rid="B62">Scotton et&#x20;al., 2014</xref>) and lead to elevated morbidity and mortality (<xref ref-type="bibr" rid="B40">Mccormack et&#x20;al., 2013</xref>). Many result from genomic mutations (<xref ref-type="bibr" rid="B36">Laing, 2012</xref>), although they can also be caused by autoimmune disorders and infections (<xref ref-type="bibr" rid="B35">Kraker and Zivkovi&#x107;, 2011</xref>). Around half manifest during childhood and classification is often based on the affected area (<xref ref-type="bibr" rid="B71">Turakhia et&#x20;al., 2013</xref>). Updated details of known mutations associated with NMDs are published yearly (<xref ref-type="bibr" rid="B7">Benarroch et&#x20;al., 2019</xref>) (<ext-link ext-link-type="uri" xlink:href="http://www.musclegenetable.fr/index.html">http://www.musclegenetable.fr/index.html</ext-link>). <xref ref-type="table" rid="T1">Table&#x20;1</xref> illustrates the main types of NMDs and shows their high heterogeneity in terms of clinical manifestation.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Classification of NMDs including some examples.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Type</th>
<th align="center">Description</th>
<th align="center">Examples</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Muscular dystrophies (MDs)</td>
<td align="left">Diseases causing weakness and degeneration of the skeletal muscles</td>
<td align="left">Myotonic dystrophy;facioscapulohumeral MD; EDMD; Duchenne MD; Becker MD; LGMDs; congenital MDs</td>
</tr>
<tr>
<td align="left">Myopathies</td>
<td align="left">Muscle diseases in which the muscle fibres do not function properly, resulting in muscle hypotonia and weakness</td>
<td align="left">Congenital myopathies; distal myopathies; endocrine myopathies; mitochondrial myopathies; metabolic myopathies</td>
</tr>
<tr>
<td align="left">Peripheral nerve diseases</td>
<td align="left">Diseases where motor and sensory nerves that connect the brain and spinal cord to the rest of the body are affected, causing impaired sensations, movements and muscular weakness</td>
<td align="left">Charcot-Marie-Tooth disease; Giant axonal neuropathy</td>
</tr>
<tr>
<td align="left">Motor neurone diseases</td>
<td align="left">Diseases where motor neurones progressively lose function, causing the muscles they control to become weak and eventually non-functional</td>
<td align="left">Hereditary spastic paraplegias; spinal muscular atrophy; spinal-bulbar muscular atrophy</td>
</tr>
<tr>
<td align="left">Ion channel diseases</td>
<td align="left">Diseases associated with defects in ion channels, typically marked by muscular weakness, absent muscle tone, or episodic muscle paralysis</td>
<td align="left">Andersen-Tawil syndrome; hyperkalemic periodic paralysis; hypokalemic periodic paralysis; myotonia congenita; paramyotonia congenita; potassium-aggravated myotonia</td>
</tr>
<tr>
<td align="left">Neuromuscular junction diseases</td>
<td align="left">Neuromuscular junction disorders that result from the destruction, malfunction or absence of one or more key proteins involved in the transmission of signals between muscles and nerves</td>
<td align="left">Congenital myasthenic syndromes; Lambert-Eaton myasthenic syndrome; myasthenia gravis</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>EDMD: Emery-Dreifuss muscular dystrophy; LGMDs: limb girdle muscular dystrophies.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Although diagnosis of NMDs has been aided in recent years by advances in whole-exome/genome sequencing (<xref ref-type="bibr" rid="B10">Brown and Meloche, 2016</xref>), it still requires a high level of medical specialisation, due to the high phenotypic and pathophysiology diversity, and large number of causal genes (<xref ref-type="bibr" rid="B41">McDonald, 2012</xref>; <xref ref-type="bibr" rid="B57">Roy et&#x20;al., 2015</xref>). Moreover, given that individual NMDs tend to be rare, it can be hard to find sufficient patients to conduct well-powered studies. As such, a range of diagnostic tests (including electrophysiology, tissue biopsies, and measuring levels of certain enzymes such as elevated serum creatinine kinase), and molecular imaging (<xref ref-type="bibr" rid="B70">Thavorntanaburt et&#x20;al., 2018</xref>) must be used, and diagnosis can be slow (<xref ref-type="bibr" rid="B68">Spuler et&#x20;al., 2011</xref>). There is no cure for most NMDs but rather symptomatic treatments to delay progression. Current research is focused on gene therapies and investigating new medications (<xref ref-type="bibr" rid="B61">Scoto et&#x20;al., 2018</xref>). However, efforts are hampered by their etiological heterogeneity and phenotype diversity.</p>
<p>Further work is needed to better understand how NMDs are related in terms of phenotypic overlap and underlying genes and mechanisms, in order to facilitate diagnosis and improve treatment. Although not specific to NMDs, previous studies have compared phenotypic profiles between different diseases to build clusters of related phenotypes (<xref ref-type="bibr" rid="B65">Sirota et&#x20;al., 2009</xref>; <xref ref-type="bibr" rid="B3">Bagley et&#x20;al., 2016</xref>); others have focused on phenotype-similarity based on co-morbidity across multiple diseases (<xref ref-type="bibr" rid="B58">Rzhetsky et&#x20;al., 2007</xref>; <xref ref-type="bibr" rid="B24">Hidalgo et&#x20;al., 2009</xref>). Such studies enable us to identify patterns between groups of diseases and phenotypes by showing how they tend to co-occur. This has multiple potential uses for disease classification and diagnosis. Further studies have investigated the connection between clinical manifestations in disease by integrating gene-disease and protein-protein interaction data (<xref ref-type="bibr" rid="B76">Yang et&#x20;al., 2011</xref>; <xref ref-type="bibr" rid="B27">Hwang et&#x20;al., 2012</xref>; <xref ref-type="bibr" rid="B82">Zhou et&#x20;al., 2014</xref>), as well as connecting proteins with phenotypes through the use of phenotypic clusters based on similarity and by predicting proteins associated with the phenotypes through machine learning (<xref ref-type="bibr" rid="B53">Ren et&#x20;al., 2020</xref>). These studies lead the way towards explaining the co-occurrence of phenotypic patterns across diseases through common underlying mechanisms.</p>
<p>There are several resources that map known diseases to their pathological phenotypes and associated genes. For example, MENDELIAN (<ext-link ext-link-type="uri" xlink:href="https://www.mendelian.co/es/">https://www.mendelian.co/es/</ext-link>) allows the symptom-guided search of rare diseases. OMIM (Online Mendelian Inheritance in Man) gathers data obtained <italic>via</italic> curation of the biomedical literature (<xref ref-type="bibr" rid="B21">Hamosh, 2004</xref>; <xref ref-type="bibr" rid="B2">Amberger et&#x20;al., 2019</xref>) to provide a clinical synopsis of all known Mendelian traits and disorders, describing genes, allelic variants and pathological phenotypes. Orphanet (<ext-link ext-link-type="uri" xlink:href="http://www.orphadata.org">http://www.orphadata.org</ext-link> and <ext-link ext-link-type="uri" xlink:href="https://www.orpha.net/">https://www.orpha.net/</ext-link>) is based on expert knowledge, gathering information about rare diseases specifically, with the aim of collecting and unifying the scarce knowledge available for such disorders, including NMDs of genetic origin. There are several tools that exploit these databases to associate disease-related phenotypes with genes, including <italic>Phen2Gene</italic> (<xref ref-type="bibr" rid="B81">Zhao et&#x20;al., 2020</xref>), <italic>AMELIE</italic> (<xref ref-type="bibr" rid="B9">Birgmeier et&#x20;al., 2020</xref>), <italic>Phevor</italic> (<xref ref-type="bibr" rid="B64">Singleton et&#x20;al., 2014</xref>), <italic>Phenolizer</italic> (<xref ref-type="bibr" rid="B75">Yang et&#x20;al., 2015</xref>) and <italic>Phenomizer</italic> (<xref ref-type="bibr" rid="B32">K&#xf6;hler et&#x20;al., 2009</xref>). Such studies require the use of common phenotype terminology in such a way that makes the information amenable to computational analysis (<xref ref-type="bibr" rid="B25">Hoehndorf et&#x20;al., 2015</xref>). The Human Phenotype Ontology (HPO, <ext-link ext-link-type="uri" xlink:href="https://hpo.jax.org/">https://hpo.jax.org/</ext-link>), provides such a standardised vocabulary to describe phenotypic abnormalities associated with more than 7&#x20;800 diseases (<xref ref-type="bibr" rid="B31">K&#xf6;hler et&#x20;al., 2021</xref>).</p>
<p>However, few studies have combined phenotype and gene information for groups of heterogeneous diseases to look for related phenotypes shared across multiple disorders with common underlying mechanisms. Such an approach was recently conducted by our group using patients with largely undiagnosed rare disorders (<xref ref-type="bibr" rid="B15">D&#xed;az-Santiago et&#x20;al., 2020</xref>), taking advantage of the rare-disease database DECIPHER (<xref ref-type="bibr" rid="B18">Firth et&#x20;al., 2009</xref>). This work showed that by using biomedical networks and systems medicine approaches our understanding of rare diseases can be improved based on phenotype co-occurrence patterns. It also showed the power of the re-analysis of existing data from public databases to obtain new knowledge, something that is recommended in the research community whenever possible (<xref ref-type="bibr" rid="B34">Kovalevskaya et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B69">Tan et&#x20;al., 2020</xref>). In this work, the automated workflow <italic>PhenoClusters</italic> is used to investigate phenotype co-occurrence across NMDs and produce functionally coherent clusters of phenotypes with similar underlying biological functions. This can help differentiate diagnosis (&#x2018;elevated serum creatine kinase&#x2019; is the most significant NMD phenotype) and provide a better understanding of NMDs (many clusters gather typical phenotypes and functions of NMDs) based on the specific cell functions (unanticipated phenotypes such as &#x2018;macroglossia&#x2019; and &#x2018;arthogryposis&#x2019; point to cell dysfunctions involved in an NMD), including those affected by pleiotropic/multi-functional&#x20;genes.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Materials and Methods</title>
<sec id="s2-1">
<title>2.1&#x20;<italic>PhenoClusters</italic> Workflow</title>
<p>The <italic>PhenoClusters</italic> workflow described in this study is based on OMIM, Orphanet and HPO data and is outlined in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. The following sections describe its modules in more detail.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Flowchart of the <italic>PhenoClusters</italic> workflow. Module <bold>(A)</bold>: all diseases in OMIM and Orphanet were classified as &#x201c;NMDs&#x201d; or &#x201c;non-NMDs&#x201d;. HPO is then queried with those disease, retaining only those diseases (red boxes) for which both a gene (teal boxes) and a phenotype (white boxes) are known. Module <bold>(B)</bold>: a bipartite network was constructed and analysed to obtain the typical &#x201c;NMD co-occurring phenotypes&#x201d; that tended to occur in NMDs. Module <bold>(C)</bold>: a tripartite network enabled the obtention of new, significant phenotype-gene pairs that were translated to &#x201c;phenotype-function pairs&#x201d;. Module <bold>(D)</bold>: communities of highly related phenotypes were filtered based on shared function to obtain the final set of &#x201c;functionally coherent clusters of phenotypes in NMDs&#x201d;. PubMed co-mention was used to assess the reliability of the co-occurrence approach. Dark grey cylinders correspond to databases; yellow boxes are relevant analyses; inverted triangles indicate process merging; light grey rectangles are intermediate sets of results; coloured rectangles with text in bold mark relevant results.</p>
</caption>
<graphic xlink:href="fmolb-08-635074-g001.tif"/>
</fig>
<sec id="s2-1-1">
<title>2.1.1 Module A: NMD Datasets With Genes, Phenotypes and Typical NMD Phenotypes</title>
<p>The OMIM and Orphanet databases (as of 15th-Nov-2019) were used in parallel since they gather information from different origins and with different goals. OMIM was searched with NMD related keywords (<italic>muscular dystrophy, myopathy, myasthenic, myasthenia, neuropathy, amyotrophic lateral sclerosis, spinal muscular atrophy, spinal and bulbar muscular atrophy, myotonia, periodic paralysis, myotonic dystrophy, mitochondrial cytopathy, necrotizing encephalomyelopathy, mitochondrial DNA depletion</italic>) to obtain a list of NMDs as complete as possible. Since Orphanet organises diseases based on ORDO (Orphanet Rare Disease Ontology) (<xref ref-type="bibr" rid="B74">Vasant et&#x20;al., 2014</xref>), all diseases descendant of the category neuromuscular diseases (Orphanet:68381) were used. Hence, diseases in OMIM and Orphanet were assigned to &#x201c;All NMDs&#x201d; or &#x201c;All non-NMDs&#x201d; (grey rectangles in Module A of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref> and <xref ref-type="table" rid="T2">Table&#x20;2</xref>). These were used to query HPO (v1.2; 15th-Nov-2019) to retain only those diseases (&#x201c;Non-NMDs&#x201d; and &#x201c;NMDs&#x201d; in <xref ref-type="table" rid="T2">Table&#x20;2</xref>, corresponding to red rectangles in Module A of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) for which both phenotype (white rectangles in Module A of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) and gene (teal rectangles in Module A of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) information was available.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Summary of diseases found in OMIM and Orphanet databases and the retained diseases, phenotypes and genes after the HPO&#x20;query.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center"/>
<th colspan="3" align="center">OMIM</th>
<th colspan="3" align="center">Orphanet</th>
</tr>
<tr>
<th align="left"/>
<th align="left"/>
<th colspan="2" align="center">HPO</th>
<th align="left"/>
<th colspan="2" align="center">HPO</th>
</tr>
<tr>
<th align="left"/>
<th align="center">Diseases</th>
<th align="center">Phenotypes</th>
<th align="center">Genes</th>
<th align="center">Diseases</th>
<th align="center">Phenotypes</th>
<th align="center">Genes</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Total</td>
<td align="char" char=".">26 943</td>
<td align="char" char=".">-</td>
<td align="char" char=".">-</td>
<td align="char" char=".">3 431</td>
<td align="char" char=".">-</td>
<td align="char" char=".">-</td>
</tr>
<tr>
<td align="left">&#x2003;All non-NMDs</td>
<td align="char" char=".">26 387</td>
<td align="char" char=".">-</td>
<td align="char" char=".">-</td>
<td align="char" char=".">3 204</td>
<td align="char" char=".">-</td>
<td align="char" char=".">-</td>
</tr>
<tr>
<td align="left">&#x2003;All NMDs</td>
<td align="char" char=".">556</td>
<td align="char" char=".">-</td>
<td align="char" char=".">-</td>
<td align="char" char=".">227</td>
<td align="char" char=".">-</td>
<td align="char" char=".">-</td>
</tr>
<tr>
<td align="left">Complete information in HPO</td>
<td align="char" char=".">5189</td>
<td align="char" char=".">6385</td>
<td align="char" char=".">4015</td>
<td align="char" char=".">2020</td>
<td align="char" char=".">5430</td>
<td align="char" char=".">2730</td>
</tr>
<tr>
<td align="left">&#x2003;Non-NMDs</td>
<td align="char" char=".">4765</td>
<td align="char" char=".">6183</td>
<td align="char" char=".">4015</td>
<td align="char" char=".">1894</td>
<td align="char" char=".">5312</td>
<td align="char" char=".">2730</td>
</tr>
<tr>
<td align="left">&#x2003;NMDs</td>
<td align="char" char=".">424</td>
<td align="char" char=".">1314</td>
<td align="char" char=".">345</td>
<td align="char" char=".">126</td>
<td align="char" char=".">1007</td>
<td align="char" char=".">222</td>
</tr>
<tr>
<td align="left">&#x2003;Common</td>
<td align="char" char=".">0</td>
<td align="char" char=".">1112</td>
<td align="char" char=".">345</td>
<td align="char" char=".">0</td>
<td align="char" char=".">889</td>
<td align="char" char=".">222</td>
</tr>
<tr>
<td align="left">&#x2003;Typical in NMDs</td>
<td align="char" char=".">-</td>
<td align="char" char=".">335</td>
<td align="char" char=".">0</td>
<td align="char" char=".">-</td>
<td align="char" char=".">216</td>
<td align="char" char=".">0</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x201c;-&#x201d;: not considered or not relevant for the analysis.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Finally, phenotype frequencies between &#x201c;NMDs&#x201d; and &#x201c;non-NMDs&#x201d; in <xref ref-type="table" rid="T2">Table&#x20;2</xref> and <xref ref-type="fig" rid="F1">Figure&#x20;1</xref> were compared using Fisher&#x2019;s exact test (one-tail) with a threshold of <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>0.05</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. A list of &#x201c;Typical NMD phenotypes&#x201d; (<xref ref-type="table" rid="T2">Table&#x20;2</xref> and <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) was thus obtained.</p>
</sec>
<sec id="s2-1-2">
<title>2.1.2 Module B: Bipartite Network to Obtain Phenotype Co-Occurrences</title>
<p>All diseases (&#x201c;NMDs&#x201d; and &#x201c;non-NMDs&#x201d;) as well as their corresponding phenotypes were used to construct a standard bipartite network (<xref ref-type="bibr" rid="B50">Pavlopoulos et&#x20;al., 2018</xref>) of disease-phenotype pairs to find common (co-occurring) phenotypes across diseases. Phenotype co-occurrences (grey rectangle in Module B of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) were extracted using <italic>NetAnalyzer</italic> (<xref ref-type="bibr" rid="B55">Rojano et&#x20;al., 2017</xref>) (see below). To recover only significant associations for NMDs (pale magenta rectangle of &#x201c;NMD co-occurring phenotypes&#x201d; in Module B of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>), all phenotype-phenotype co-occurrences were filtered using the &#x201c;Typical NMD phenotypes&#x201d; obtained from Module&#x20;A.</p>
</sec>
<sec id="s2-1-3">
<title>2.1.3 Module C: Tripartite Network to Obtain Phenotype-Function Pairs</title>
<p>A tripartite network of all diseases (NMDs and non-NMDs), their phenotypes and the affected genes was constructed to link, in first instance, phenotypes with genes, based on their co-occurrence across diseases. The network was constructed as described in (<xref ref-type="bibr" rid="B55">Rojano et&#x20;al., 2017</xref>) and then investigated using <italic>NetAnalyzer</italic> to find significant phenotype-gene co-occurrences (grey rectangle in Module C of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). Phenotype-gene pairs were converted into phenotype-function pairs based on the biological process sub-ontology from Gene Ontology (GO), KEGG (Kyoto Encyclopaedia of Genes and Genomes) pathways and Reactome pathways. To reveal those enriched functions significantly associated with a given phenotype, all genes associated with that phenotype were obtained and this gene list was used for functional enrichment, based on over-representation analysis (<xref ref-type="bibr" rid="B78">Yu et&#x20;al., 2012</xref>). Association between phenotypes and genes/functions was performed separately for OMIM and Orphanet. This resulted in significant &#x201c;phenotype-function pairs&#x201d; (pale cyan rectangle in bold in Module C of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>).</p>
</sec>
<sec id="s2-1-4">
<title>2.1.4 Module D: Functionally-Coherent Clusters of Phenotypes in NMDs</title>
<p>The typical NMD phenotypes obtained in Module B were used to detect communities of related, highly interconnected phenotypes (grey rectangle at bottom centre of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) using the R package <italic>linkcomm</italic>. Following the rationale proposed in (<xref ref-type="bibr" rid="B15">D&#xed;az-Santiago et&#x20;al., 2020</xref>), phenotype communities for which at least 70% of the constituent phenotypes shared the same functional annotations obtained from the phenotype-function pairs of Module C were retained. These were considered &#x201c;functionally coherent clusters of phenotypes in NMDs&#x201d; (final dark rectangle in Module D of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) and constitute the major result of the workflow. OMIM clusters were tagged with &#x201c;&#x2a;&#x201d;, while Orphanet clusters were tagged with &#x201c;&#x23;&#x201d;.</p>
</sec>
</sec>
<sec id="s2-2">
<title>2.2 PubMed Co-Mention to Validate the Co-Occurrence Approach</title>
<p>Phenotypes co-occurring in NMDs from Module B and phenotype-function pairs from Module C were investigated in terms of co-mention in the scientific literature, by comparing how many PubMed abstracts mention both terms in a given pair, to how many abstracts mention only one of them. To do so, the NCBI Entrez Programming Utilities API was used as previously described (<xref ref-type="bibr" rid="B15">D&#xed;az-Santiago et&#x20;al., 2020</xref>). In brief, the different textual descriptions for a given i) phenotype as described in HPO, ii) GO term from the biological process vocabulary, iii) KEGG pathways, and iv) Reactome pathways, were retrieved. All these terms were queried separately in PubMed (the complete database) to obtain the lists of PMIDs (PubMed identifiers) of abstracts mentioning each given term. PMID lists were then compared for each pair of terms (phenotype-phenotype, phenotype-GO, phenotype-KEGG or phenotype-Reactome) using Fisher&#x2019;s exact test to detect the significantly (<inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>0.05</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>) co-mentioned pairs. The numbers of significant pairs obtained for each set was then compared to the number of significant pairs obtained from random models, by calculating whether the probability of finding as many significant pairs in the random dataset was at least as high as that detected using real&#x20;data.</p>
</sec>
<sec id="s2-3">
<title>2.3 Tissue Expression Testing</title>
<p>Genes in phenotype-gene associations were further analysed to see if they were more likely to be expressed in neuronal or muscular tissues, both highly relevant for NMDs. To do so, expression location of genes paired with NMD phenotypes was compared to that of genes paired with non-NMD phenotypes. Expression locations were obtained from the normal tissue expression dataset (<italic>normal_tissue.tsv.zip</italic> file) at The Human Protein Atlas version 20.0 (<xref ref-type="bibr" rid="B72">Uhl&#xe9;n et&#x20;al., 2015</xref>) (<ext-link ext-link-type="uri" xlink:href="http://www.proteinatlas.org">http://www.proteinatlas.org</ext-link>). A gene was considered as expressed in neuronal or muscular tissue if it showed medium or high expression in one of the following tissue types: cerebellum, cerebral cortex, hippocampus, caudate neuronal cells, skeletal muscle or heart muscle. The relative proportions of genes from each set that showed expression in neuronal or muscular tissue were compared using Fisher&#x2019;s exact&#x20;test.</p>
</sec>
<sec id="s2-4">
<title>2.4&#x20;<italic>PhenoClusters</italic> Architecture and Execution Details</title>
<p>All the above calculations have been implemented as an automated workflow named <italic>PhenoClusters</italic> that is based on <italic>PhenCo</italic> (<xref ref-type="bibr" rid="B15">D&#xed;az-Santiago et&#x20;al., 2020</xref>) and uses additional scripts from (<xref ref-type="bibr" rid="B28">Jabato et&#x20;al., 2020</xref>). The Picasso supercomputer of University of Malaga was used for code implementation and testing. It consists of an OpenSUSE LEAP 12.3 with Slurm queue system and Infiniband network (54/40 Gbps) containing 216 nodes with Intel E5-2670 2.6&#xa0;GHz cores for a total of 3&#x20;456 cores and 22&#xa0;TB of RAM. The code is available from GitHub at <ext-link ext-link-type="uri" xlink:href="https://github.com/Elenadisa/PhenoClusters">https://github.com/Elenadisa/PhenoClusters</ext-link>. The main requirements are Python 3, Ruby 2.4.1, R 4.0.0 or higher, Bioconductor 3.4 (<xref ref-type="bibr" rid="B26">Huber et&#x20;al., 2015</xref>) or higher, scripts from <italic>sys_bio_lab</italic> (<xref ref-type="bibr" rid="B28">Jabato et&#x20;al., 2020</xref>), and <italic>Anaconda Individual edition</italic> (<ext-link ext-link-type="uri" xlink:href="https://docs.anaconda.com/anaconda/install/">https://docs.anaconda.com/anaconda/install/</ext-link>) as package and environment manager. The workflow was managed using <italic>AutoFlow</italic> (<xref ref-type="bibr" rid="B63">Seoane et&#x20;al., 2016</xref>).</p>
<p>For co-occurrence analysis, <italic>PhenoClusters</italic> requires <italic>NetAnalyzer</italic> (<xref ref-type="bibr" rid="B55">Rojano et&#x20;al., 2017</xref>). Although many co-occurrence methods are available, previous work suggests that the hypergeometric index (<italic>HyI</italic>) (<xref ref-type="bibr" rid="B5">Fuxman Bass et&#x20;al., 2013</xref>), which can be considered analogous to a contingency table based approach, is the most suitable for co-occurrence studies (<xref ref-type="bibr" rid="B55">Rojano et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B11">Bueno et&#x20;al., 2018</xref>). Hence, <inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mi>y</mml:mi>
<mml:mi>I</mml:mi>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> was set to calculate associations within the layers of a network and obtain phenotype-phenotype or phenotype-gene associations that were considered significant co-occurrences (<xref ref-type="bibr" rid="B15">D&#xed;az-Santiago et&#x20;al., 2020</xref>).</p>
<p>Functional enrichment was performed using the genes associated with each phenotype. The Bioconductor package <italic>clusterProfiler</italic> 3.18.0 (<xref ref-type="bibr" rid="B78">Yu et&#x20;al., 2012</xref>) was used to extract the biological process subontology from GO and the KEGG pathways and conduct over-representation analysis for these resources. The Bioconductor package <italic>ReactomePA</italic> 1.34.0 (<xref ref-type="bibr" rid="B77">Yu and He, 2016</xref>) was used to extract Reactome pathway data and perform over-representation analysis for this resource. Both packages were executed with default parameters (<italic>pvalueCutoff</italic> &#x3d; <italic>0.05, pAdjustMethod</italic> &#x3d; &#x201c;<italic>BH</italic>&#x201d;<italic>, universe, qvalueCutoff</italic> &#x3d; <italic>0.2, minGSSize</italic> &#x3d; <italic>10, maxGSSize</italic> &#x3d; <italic>500</italic>) and only the assignments with <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>0.05</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> after Benjamini-Hochberg multiple testing adjustment (<xref ref-type="bibr" rid="B8">Benjamini and Hochberg, 1995</xref>) were considered significant.</p>
<p>Highly interconnected phenotype communities were obtained using the R-CRAN package <italic>linkcomm</italic> 1.0.13 (<xref ref-type="bibr" rid="B29">Kalinka and Tomancak, 2011</xref>) with default parameters for undirected networks. R-CRAN packages required for graphical representations and data management are <italic>ggplot2</italic> 3.3.2, <italic>RColorBrewer</italic> 1.1.2, <italic>igraph</italic> 1.2.6, <italic>dplyr</italic> 1.0.2 and <italic>VennDiagram</italic> 1.6.20. The final, user-friendly HTML reports were produced using R markdown packages <italic>rmarkdown</italic> 2.6, <italic>knitr</italic> 1.30 and <italic>kableExtra</italic>&#x20;1.3.1.</p>
<p>Details about <italic>PhenoClusters</italic> execution can be found at <ext-link ext-link-type="uri" xlink:href="https://github.com/Elenadisa/PhenoClusters">https://github.com/Elenadisa/PhenoClusters</ext-link>. As can be seen, diseases from OMIM and Orphanet were considered separately in different scripts. One run usually takes at least 6&#xa0;h 45&#xa0;min without the co-mention verification, since literature analysis takes a very long, heterogeneous amount of time depending on the PubMed server overload. The resulting reports are named <italic>omim_report.html</italic> (<xref ref-type="sec" rid="s9">Supplementary Material S1</xref>) and <italic>orphanet_report.html</italic> (<xref ref-type="sec" rid="s9">Supplementary Material S2</xref>). To simplify cluster inspection, they are also saved as independent files in <italic>omim_clusters_report.html</italic> and <italic>orphanet_clusters_report.html</italic> including the cluster ID, the phenotype graph together with HPO IDs and descriptions, as well as the associated functions and the genes identified within them. Clusters showing functional coherence are given at the top of the file. For the sake of simplicity, &#x201c;&#x2a;&#x201d; is used to tag OMIM clusters, while Orphanet clusters are tagged by &#x201c;&#x23;&#x201d;, as indicated in Module&#x20;D.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Typical NMD Phenotypes Reflect Neuromotor Impairments</title>
<p>Diseases in OMIM and Orphanet were classified as NMD or non-NMD (<xref ref-type="table" rid="T2">Table&#x20;2</xref>). All downstream analysis treated the resources separately (<xref ref-type="sec" rid="s9">Supplementary Material S1, S2</xref>). The total numbers of diseases in each resource for which genes and pathological phenotype information was available are shown in <xref ref-type="table" rid="T2">Table&#x20;2</xref>; full details can be found in <xref ref-type="sec" rid="s9">Supplementary Material S3, S4</xref>. It can be seen that relatively few diseases were considered NMDs with known genes and phenotypes in HPO (424 and 125 in OMIM and Orphanet, respectively). Many phenotypes were shared by both NMDs and non-NMDs (row &#x201c;Common&#x201d; in <xref ref-type="table" rid="T2">Table&#x20;2</xref>). Fisher&#x2019;s exact test was then performed to compare the relative occurrence of each phenotype between disease groups to find those relatively more common in NMDs. This resulted in 335 and 216 typical NMD phenotypes for OMIM and Orphanet. Overlap between the two is shown in <xref ref-type="fig" rid="F2">Figure&#x20;2</xref>, where Panels B and C show that the proportion of common phenotypes in both sets increases with decreasing cutoff <italic>p</italic>-values. This reinforces the suitability of the co-occurrence approach to extract typical NMD phenotypes.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Common and distinct disease-associated HPO-phenotypes in OMIM and Orhpanet described in <xref ref-type="table" rid="T2">Table&#x20;2</xref>. <bold>(A)</bold>: Distribution of the 6&#x20;385 HPO phenotypes for OMIM and the 5&#x20;430 phenotypes for Orphanet for all NMDs and non-NMDs. <bold>(B)</bold>: Distribution of the typical 335 OMIM and 216 Orphanet phenotypes significantly (<inline-formula id="inf5">
<mml:math id="m5">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>0.05</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>) associated with NMDs. <bold>(C)</bold>: Same as B, but using the increased significance (<inline-formula id="inf6">
<mml:math id="m6">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>0.001</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>) NMD-associated phenotypes (172 for OMIM and 110 for Orphanet).</p>
</caption>
<graphic xlink:href="fmolb-08-635074-g002.tif"/>
</fig>
<p>The top over-represented phenotypes are shown in <xref ref-type="sec" rid="s9">Supplementary Material S5</xref>. The most significant in both resources is &#x2018;elevated serum creatine kinase&#x2019;, which reflects the important role of muscle decay in NMDs, given that the normal location of this enzyme is the cytoplasm and mitochondria, not serum (<xref ref-type="bibr" rid="B45">Moghadam-Kia et&#x20;al., 2016</xref>). This result is reassuring with respect to the approach of <italic>PhenoClusters</italic>, as elevated serum creatine kinase is routinely tested when diagnosing NMDs as a consequence of muscle injury (<xref ref-type="bibr" rid="B70">Thavorntanaburt et&#x20;al., 2018</xref>).</p>
<p>The top phenotypes (<xref ref-type="sec" rid="s9">Supplementary Material S5</xref>) seem to be more indicative of muscular impairment than neuronal dysfunction, pointing to proximal or distal muscular weakness, both very typical in the clinical history of NMD patients (<xref ref-type="bibr" rid="B41">McDonald, 2012</xref>; <xref ref-type="bibr" rid="B47">Mukherjee et&#x20;al., 2019</xref>). Other important phenotypes are related to specific diseases, such as Duchenne/Becker muscular dystrophy (&#x2018;calf muscle hypertrophy&#x2019;, &#x2018;Gowers sign&#x2019;), where muscle hypertrophy can exaggerate postural instability and joint contracture (<xref ref-type="bibr" rid="B33">Kornegay et&#x20;al., 2012</xref>). In contrast, the absence of &#x2018;hypotonia&#x2019;-related phenotypes in this top ten list is notable. However, it should be made clear that such phenotypes were also significantly over-represented among NMDs, just not included in the top ten (<xref ref-type="sec" rid="s9">Supplementary Material S3, S4</xref>). To conclude, the <italic>PhenoClusters</italic> approach to obtain statistically over-represented phenotypes for NMDs extracts phenotypes characteristic of these disorders.</p>
</sec>
<sec id="s3-2">
<title>3.2 Typical NMD Phenotypes Tend to Co-Occur Across Diseases</title>
<p>Bipartite networks were created (one for OMIM diseases and another for Orphanet), with nodes representing diseases and phenotypes, and edges representing known relations in OMIM or Orphanet respectively. The network was analysed to identify pairs of typical NMD phenotypes that tend co-occur across diseases (Module B in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). Around a quarter of all phenotype pairs co-occurring in at least one disease showed significant co-occurrence (27.61% in OMIM and 21.20% in Orphanet). Only a small subset (&#x2264;1 %) of all phenotype pairs represent significant co-occurrence between NMD phenotypes. However, this value was far lower for the random sets of non-NMD phenotypes, being almost negligible (<xref ref-type="table" rid="T3">Table&#x20;3</xref>), showing that pairs of NMD phenotypes are far more likely to significantly co-occur across multiple diseases than pairs of randomly selected phenotypes. These results point to the presence of comorbidity between NMD phenotypes.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Numbers of pairs of co-occurring phenotypes for the OMIM and Orphanet databases. Significantly co-occurring pairs defined as having a hypergeometric index value <inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Category</th>
<th align="center">OMIM</th>
<th align="center">Orphanet</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Total co-occurring phenotype pairs</td>
<td align="char" char=".">455 379</td>
<td align="char" char=".">467 899</td>
</tr>
<tr>
<td align="left">Significant co-occurring pairs (<inline-formula id="inf8">
<mml:math id="m8">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mi>y</mml:mi>
<mml:mi>I</mml:mi>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>)</td>
<td align="char" char=".">125 720</td>
<td align="char" char=".">99 193</td>
</tr>
<tr>
<td align="left">Significant co-occurring pairs, NMD phenotypes</td>
<td align="char" char=".">4 579</td>
<td align="char" char=".">2 314</td>
</tr>
<tr>
<td align="left">Significant co-occurring pairs, non-NMD phenotypes<xref ref-type="table-fn" rid="Tfn1">
<italic>
<sup>a</sup>
</italic>
</xref>
</td>
<td align="center">
<inline-formula id="inf9">
<mml:math id="m9">
<mml:mrow>
<mml:mn>655</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>46.4</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf10">
<mml:math id="m10">
<mml:mrow>
<mml:mn>173</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>16.43</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn1">
<label>
<sup>a</sup>
</label>
<p>This result is expressed as the average&#x20;&#xb1; SD for 100 sets of 335 randomly chosen OMIM non-NMD phenotypes and 216 random Orphanet non-NMD phenotypes; the non-NMD phenotypes were selected to have a similar prevalence to the NMD phenotypes.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3-3">
<title>3.3&#x20;Co-Occurring Phenotypes Tend to be Co-Mentioned in Research Papers</title>
<p>As well as showing that the typical NMD phenotypes tended to co-occur across diseases much more frequently than non-NMD phenotypes, further validation was performed based on co-mention analysis for each phenotype pair within PubMed abstracts. The NMD phenotype pairs were shown to be co-mentioned in the literature much more frequently than equal numbers of pairs of randomly chosen non-NMD phenotypes (<xref ref-type="table" rid="T3">Table&#x20;3</xref>). Fisher&#x2019;s exact test analysis revealed that 1&#x20;173 OMIM pairs and 689 Orphanet pairs (<xref ref-type="sec" rid="s9">Supplementary Tables S1, S2</xref>) were significantly co-mentioned. Conversely, for non-NMDs, the numbers of significant pairs were much lower (<inline-formula id="inf11">
<mml:math id="m11">
<mml:mrow>
<mml:mn>333.08</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>34.63</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> in OMIM and <inline-formula id="inf12">
<mml:math id="m12">
<mml:mrow>
<mml:mn>110.0</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>13.47</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> in Orphanet, <xref ref-type="sec" rid="s9">Supplementary Tables S1, S2</xref>, respectively). These differences were also supported by the distribution of their <italic>p</italic>-values (<xref ref-type="sec" rid="s9">Supplementary Figures S1, S2</xref>) that were clearly more dense at <inline-formula id="inf13">
<mml:math id="m13">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>0.05</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> for NMDs than in non-NMDs. These results demonstrate the validity of the <italic>PhenoClusters</italic> approach to find pairs of NMD-related phenotypes that tend to co-occur together.</p>
</sec>
<sec id="s3-4">
<title>3.4&#x20;Phenotype-Function Associations are Robust</title>
<p>Associations between NMD phenotypes and genes and functions were calculated in order to uncover potential underlying mechanisms leading to the expression of a pathological phenotype. This was done by initially connecting phenotypes with genes using a tripartite network based approach (Module C in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) by combining all disease-phenotype pairs and all disease-gene pairs in OMIM and Orphanet separately. The networks were then analysed in order to connect genes with phenotypes based on co-occurrence across multiple diseases.</p>
<p>Using a threshold of <inline-formula id="inf14">
<mml:math id="m14">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mi>y</mml:mi>
<mml:mi>I</mml:mi>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, 34&#x20;139 and 36&#x20;218&#x20;phenotype-gene associations were obtained for OMIM and Orphanet, respectively; from these, a total of 1&#x20;078 and 611 distinct genes were associated with NMD phenotypes, respectively. There was significant overlap between OMIM and Orphanet in terms of genes associated with NMD phenotypes (<inline-formula id="inf15">
<mml:math id="m15">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>2.2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, Fisher&#x2019;s exact test using all phenotype-associated genes as background). Moreover, a significantly greater proportion of the NMD associated genes (84.41% in OMIM, 86.73% in Orphanet) were shown to be expressed in neuronal or muscle tissue than the non-NMD associated genes (70.32% in OMIM. 72.88% in Orphanet), which is a statistically significant difference (<inline-formula id="inf16">
<mml:math id="m16">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>2.2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf17">
<mml:math id="m17">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>6.3</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>11</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, for OMIM and Orphanet, respectively). The same kind of test was performed for the remaining non-relevant tissues, revealing in this case that there was no significant difference between NMD and non-NMD genes after a Fisher&#x2019;s test (<inline-formula id="inf18">
<mml:math id="m18">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>0.9</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> for both databases).</p>
<p>The genes associated with each phenotype were then used for functional enrichment analysis using <italic>clusterprofiler</italic> and <italic>ReactomePA</italic> to find over-represented (<inline-formula id="inf19">
<mml:math id="m19">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>0.05</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>) GO terms (biological process ontology), and KEGG and Reactome pathways (<xref ref-type="table" rid="T4">Table&#x20;4</xref>). As with gene-based analysis, there was significant overlap between OMIM and Orphanet (<inline-formula id="inf20">
<mml:math id="m20">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>2.2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mn>6.842</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>8</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf21">
<mml:math id="m21">
<mml:mrow>
<mml:mn>2.381</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>14</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, respectively, using Fisher&#x2019;s exact test with all phenotype-associated functions used as background). <xref ref-type="sec" rid="s9">Supplementary Material S6</xref> shows the overlap between the different resources using Venn diagrams. Therefore, genes associated with NMD phenotypes are significantly expressed in neuronal and muscle tissue, the most relevant for NMDs, supporting the robustness of the phenotype-function pairs obtained by <italic>PhenoClusters</italic>.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Numbers of genes and functions associated with phenotypes. Total: all genes in each dataset. &#x201c;Any&#x201d;: genes/functions associated with any phenotype. &#x201c;Only NMD&#x201d;: genes/functions associated with a typical NMD phenotype.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left" colspan="1">Feature</th>
<th colspan="4" align="center">OMIM-based</th>
<th colspan="4" align="center">Orphanet-based</th>
<th colspan="4" align="center">OMIM-Orphanet overlap</th>
</tr>
<tr>
<th align="left"/>
<th align="center">Genes</th>
<th align="center">GOs</th>
<th align="center">KEGG</th>
<th align="center">Reac</th>
<th align="center">Genes</th>
<th align="center">GOs</th>
<th align="center">KEGG</th>
<th align="center">Reac</th>
<th align="center">Genes</th>
<th align="center">GOs</th>
<th align="center">KEGG</th>
<th align="center">Reac</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Total</td>
<td align="center">4015</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">2730</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">2452</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">-</td>
</tr>
<tr>
<td align="left">Any</td>
<td align="center">3870</td>
<td align="center">6398</td>
<td align="center">214</td>
<td align="center">1397</td>
<td align="center">2700</td>
<td align="center">6281</td>
<td align="center">209</td>
<td align="center">1356</td>
<td align="center">2374</td>
<td align="center">6260</td>
<td align="center">208</td>
<td align="center">1348</td>
</tr>
<tr>
<td align="left">Only NMD</td>
<td align="center">1078</td>
<td align="center">3747</td>
<td align="center">142</td>
<td align="center">821</td>
<td align="center">611</td>
<td align="center">3618</td>
<td align="center">123</td>
<td align="center">631</td>
<td align="center">360</td>
<td align="center">2666</td>
<td align="center">102</td>
<td align="center">451</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x201c;-&#x201d;: not considered or relevant in the analysis.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In spite of the robustness of these novel associations between phenotypes and functions, additional validation was performed based on co-mention analysis using PubMed abstracts as a sign of relevance. Term co-occurrence of a given phenotype alongside its corresponding function was looked for within the same abstract (<xref ref-type="sec" rid="s9">Supplementary Figures S1, S2</xref>). Only a subset of the phenotype-function pairs obtained from the network were significantly co-mentioned (&#x201c;Confirmed&#x201d; columns in <xref ref-type="table" rid="T5">Table&#x20;5</xref>). However, this subset was several times larger than the number of co-mentioned pairs within the &#x201c;random&#x201d; pairs, and this difference was significant for all comparisons (<inline-formula id="inf22">
<mml:math id="m22">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>2.2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>) using Fisher&#x2019;s exact test. Consistent results were found for both OMIM and Orphanet: respectively i) 5% and 4% of phenotype-GO pairs, ii) 10.5% and 9% of KEGG pairs, and iii) 4% and 3% of Reactome pairs were significantly co-mentioned. As such, <italic>PhenoClusters</italic> (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) appears to produce robust and reliable associations between NMD phenotypes and functions based on phenotype and gene co-occurrence across diseases. Even though only a small fraction could be confirmed in PubMed abstracts, this was several times more than would be expected by chance. The analysis showed much higher co-mention for the KEGG associations as a proportion of the total pairs. This supports our previous work suggesting that information in KEGG is more reliable for functional studies in certain situations (<xref ref-type="bibr" rid="B38">Luque-Baena et&#x20;al., 2014</xref>).</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Co-mention validation of phenotype-function pairs. &#x201c;All&#x201d; corresponds to all pairs including a function from <xref ref-type="table" rid="T4">Table&#x20;4</xref>. &#x201c;Confirmed&#x201d; refers to the number of these pairs that were significantly co-mentioned in PubMed. &#x201c;Random&#x201d; refers to the number of pairs in a randomised list based on &#x201c;All&#x201d; pairs that were significantly co-mentioned in PubMed; average of 100 random datasets&#x20;&#xb1; SD is shown in this&#x20;case.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left" colspan="1">Paired</th>
<th colspan="6" align="center">Phenotypes</th>
</tr>
<tr>
<th align="left" colspan="1">function</th>
<th colspan="3" align="center">OMIM</th>
<th colspan="3" align="center">Orphanet</th>
</tr>
<tr>
<th align="left"/>
<th align="center">All</th>
<th align="center">Confirmed</th>
<th align="center">Random<xref ref-type="table-fn" rid="Tfn2">
<sup>a</sup>
</xref>
</th>
<th align="center">All</th>
<th align="center">Confirmed</th>
<th align="center">Random<xref ref-type="table-fn" rid="Tfn2">
<sup>a</sup>
</xref>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">GO</td>
<td align="char" char=".">567 721</td>
<td align="char" char=".">26 841</td>
<td align="center">
<inline-formula id="inf23">
<mml:math id="m23">
<mml:mrow>
<mml:mn>10</mml:mn>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mn>814</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>80.5</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="char" char=".">535 389</td>
<td align="char" char=".">21 863</td>
<td align="center">
<inline-formula id="inf24">
<mml:math id="m24">
<mml:mrow>
<mml:mn>9</mml:mn>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mn>613</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>93.4</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="left">KEGG</td>
<td align="char" char=".">17 679</td>
<td align="char" char=".">1 858</td>
<td align="center">
<inline-formula id="inf25">
<mml:math id="m25">
<mml:mrow>
<mml:mn>627</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>22.1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="char" char=".">17 104</td>
<td align="char" char=".">1 556</td>
<td align="center">
<inline-formula id="inf26">
<mml:math id="m26">
<mml:mrow>
<mml:mn>628</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>21.2</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="left">Reactome</td>
<td align="char" char=".">82 826</td>
<td align="char" char=".">3 278</td>
<td align="center">
<inline-formula id="inf27">
<mml:math id="m27">
<mml:mrow>
<mml:mn>1001</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>166.3</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="char" char=".">78 409</td>
<td align="char" char=".">2 402</td>
<td align="center">
<inline-formula id="inf28">
<mml:math id="m28">
<mml:mrow>
<mml:mn>816</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>28.7</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn2">
<label>
<sup>a</sup>
</label>
<p>The randomised phenotype-function pair set was formed by shuffling the links between the pairs in each list, keeping the total number of links per phenotype/function unchanged. This sampling procedure was repeated to produce 100 different replicas of randomised phenotype-function pairs. These sets were used in the corresponding Fisher&#x2019;s exact&#x20;tests.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3-5">
<title>3.5 Clusters Formed Between NMD Phenotypes are Functionally Coherent</title>
<p>The pairs of significantly co-occurring NMD phenotypes (pale magenta rectangle of Module B in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) were processed to extract communities of highly interconnected phenotypes (Module D in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). As summarised in <xref ref-type="table" rid="T6">Table&#x20;6</xref>, the number of communities and average number of phenotypes per community is higher using the modules based on NMD phenotypes compared to non-NMDs. This indicates that the co-occurring NMD phenotypes tend to form groups of related phenotypes.</p>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>Overview of communities (numbers and average sizes) generated with the co-occurrent phenotype pairs for OMIM and Orphanet. Values shown for communities obtained using pairs of NMD phenotypes and equal numbers of randomly generated pairs of non-NMD phenotypes (average&#x20;&#xb1; SD).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left" colspan="1">Community</th>
<th colspan="2" align="center">OMIM</th>
<th colspan="2" align="center">Orphanet</th>
</tr>
<tr>
<th align="left"/>
<th align="center">NMD</th>
<th align="center">non-NMD<xref ref-type="table" rid="T6">
<sup>a</sup>
</xref>
</th>
<th align="center">NMD</th>
<th align="center">non-NMD<xref ref-type="table" rid="T6">
<sup>a</sup>
</xref>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Total number</td>
<td align="char" char=".">231</td>
<td align="center">
<inline-formula id="inf29">
<mml:math id="m29">
<mml:mrow>
<mml:mn>94.98</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>9.6</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="char" char=".">150</td>
<td align="center">
<inline-formula id="inf30">
<mml:math id="m30">
<mml:mrow>
<mml:mn>23.85</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>4.293</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="left">Phenotypes per community</td>
<td align="char" char=".">16.75</td>
<td align="center">
<inline-formula id="inf31">
<mml:math id="m31">
<mml:mrow>
<mml:mn>5.55</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>0.6</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="char" char=".">13.63</td>
<td align="center">
<inline-formula id="inf32">
<mml:math id="m32">
<mml:mrow>
<mml:mn>4.15</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>0.278</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="left">Functionally coherent clusters</td>
<td align="char" char=".">40</td>
<td align="center">
<inline-formula id="inf33">
<mml:math id="m33">
<mml:mrow>
<mml:mn>41.21</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>7.72</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="char" char=".">72</td>
<td align="center">
<inline-formula id="inf34">
<mml:math id="m34">
<mml:mrow>
<mml:mn>14.51</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>3.189</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn3">
<label>
<sup>a</sup>
</label>
<p>&#x2018;non-NMD&#x2019; results correspond to the grouping obtained using the 100 random sets described in <xref ref-type="table" rid="T3">Table&#x20;3</xref>.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The phenotype communities were combined with the phenotype-function associations obtained previously (light cyan rectangle of Module C in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) to evaluate their functional coherence. In total, 40 OMIM communities and 72 Orphanet communities (<xref ref-type="table" rid="T6">Table&#x20;6</xref>) showed coherent function, defined as having shared functional enrichment for at least 70% of their constituent phenotypes; they constituted the &#x201c;functionally coherent clusters&#x201d;. The complete list of functionally coherent clusters is provided at the end of the reports given in <xref ref-type="sec" rid="s9">Supplementary Material S1, S2</xref>. In terms of cluster properties, some have high interconnection (&#x2a;193, &#x2a;138, &#x2a;219, &#x23;115, &#x23;150), others show spoke-hub structure, with a central node connected to a number of other nodes which do not then connect to each other (clusters &#x2a;58, &#x2a;1, &#x2a;3, &#x2a;4, &#x2a;91, &#x2a;26, &#x23;144, &#x23;2, &#x23;3, &#x23;21, &#x23;60, &#x23;22), and others have near linear topology (&#x2a;146, &#x2a;85, &#x23;97). Compared to their respective random non-NMD models <xref ref-type="table" rid="T6">Table&#x20;6</xref>, OMIM presents a similar number of clusters, in stark contrast with Orphanet, for which 5&#x20;times more clusters were found. The coherence threshold must be decreased to 50% to find a substantially different number of coherent clusters in OMIM compared to the random datasets (<xref ref-type="sec" rid="s9">Supplementary Figure S1</xref>), This difference may be due to the OMIM clusters being larger than for Orphanet (16.75 vs. 13.63 phenotypes, respectively) or related to the nature of the diseases considered NMDs in each dataset. These results support the approach presented here in which the information from the different databases is considered separately, with Orphanet arguably providing more confident results with respect to how well the typical NMD phenotypes in these clusters represent realistic and useful groupings of co-occurrent phenotypes that reflect co-morbidity with shared underlying cellular functions.</p>
</sec>
<sec id="s3-6">
<title>3.6 Clinical Application I: Functionally Coherent Clusters Help Direct Diagnosis</title>
<p>The functionally coherent clusters found by our approach (<xref ref-type="sec" rid="s9">Supplementary Material S1, S2</xref>) were inspected by clinicians with expertise in paediatric neuromuscular diseases, finding clusters with sets of expected phenotypes for NMDs, and others with unexpected phenotypes. Clusters are grouped in <xref ref-type="table" rid="T7">Table&#x20;7</xref> based on the area in which the constituent phenotypes manifest, followed by further subdivision by group of NMD. Since they represent direct links between NMDs, their symptoms and their underlying mechanisms, they could be used for clinical diagnosis, by suggesting novel phenotypes to test for, should a patient present other phenotypes within a cluster. They also suggest potentially affected genes, useful for directing genetic analysis, and potentially affected functions. Although this analysis necessarily has a subjective aspect, given that clinicians differ in training and experience, it is remarkable that <italic>PhenoClusters</italic> produces functionally coherent clusters easily recognised by clinicians. In summary, there are multiple clusters that fit in with our current knowledge about NMDs as shown in <xref ref-type="table" rid="T7">Table&#x20;7</xref>, which reinforces once again the coherence of the results generated by the presented approach.</p>
<table-wrap id="T7" position="float">
<label>TABLE 7</label>
<caption>
<p>Known associations between NMDs, clusters and underlying cell function, sorted by topological and pathophysiological levels.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Topological or pathophysiological level</th>
<th align="center">Group of NMD</th>
<th align="center">Cluster ID: main cell function involved<xref ref-type="table-fn" rid="Tfn4">
<sup>a</sup>
</xref>
</th>
<th align="center">References</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td colspan="4" align="left">
<italic>Peripheral nervous system</italic>
</td>
</tr>
<tr>
<td rowspan="2" align="left">2<sup>nd</sup> motor neuron in the anterior horn of the spinal cord</td>
<td rowspan="2" align="left">Spinal muscular atrophy</td>
<td align="left">&#x2a;82: R-HSA-191859 snRNP Assembly</td>
<td rowspan="2" align="left">
<xref ref-type="bibr" rid="B6">B&#xe4;umer et&#x20;al. (2009)</xref>, <xref ref-type="bibr" rid="B56">Rossoll and Bassell (2009)</xref>
</td>
</tr>
<tr>
<td align="left">&#x2a;82: R-HSA-194441 Metabolism of non-coding RNA</td>
</tr>
<tr>
<td rowspan="5" align="left">Peripheral nerve</td>
<td rowspan="5" align="left">Peripheral neuropathies</td>
<td align="left">&#x2a;3: GO:0042552 &#x2013; myelination</td>
<td rowspan="5" align="left">
<xref ref-type="bibr" rid="B30">Kamil et&#x20;al. (2019)</xref>, <xref ref-type="bibr" rid="B83">Zhou and Notterpek (2016)</xref>
</td>
</tr>
<tr>
<td align="left">&#x2a;23: GO:0008366 &#x2013; axon ensheathment</td>
</tr>
<tr>
<td align="left">&#x2a;67: GO:0042552 &#x2013; myelination</td>
</tr>
<tr>
<td align="left">&#x2a;200: GO:0008366 &#x2013; axon ensheathment</td>
</tr>
<tr>
<td align="left">&#x2a;47: GO:0008366 &#x2013; axon ensheathment</td>
</tr>
<tr>
<td rowspan="3" align="left">Neuromuscular junction</td>
<td rowspan="3" align="left">Myasthenic syndromes</td>
<td align="left">&#x2a;97: GO:0007274 &#x2013; neuromuscular synaptic transmission</td>
<td rowspan="3" align="left">
<xref ref-type="bibr" rid="B54">Rodr&#xed;guez Cruz et&#x20;al. (2018)</xref>, <xref ref-type="bibr" rid="B66">Souza et&#x20;al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">&#x2a;166: GO:0007271 &#x2013; synaptic transmission, cholinergic</td>
</tr>
<tr>
<td align="left">&#x2a;166: GO:0007528 &#x2013; neuromuscular junction development</td>
</tr>
<tr>
<td rowspan="11" align="left">Muscle</td>
<td rowspan="3" align="left">Congenital or developmental myopathies</td>
<td align="left">&#x2a;15: GO:0048747 &#x2013; muscle fiber development</td>
<td rowspan="3" align="left">
<xref ref-type="bibr" rid="B59">Sarnat (1994)</xref>, <xref ref-type="bibr" rid="B12">Cassandrini et&#x20;al. (2017)</xref>
</td>
</tr>
<tr>
<td align="left">&#x2a;6: GO:0051146 &#x2013; striated muscle cell differentiation</td>
</tr>
<tr>
<td align="left">&#x2a;6: GO:0048747 &#x2013; muscle fiber development</td>
</tr>
<tr>
<td align="left">Myotonic syndromes/dystrophies</td>
<td align="left">&#x2a;193: GO:0003012 &#x2013; muscle system process</td>
<td align="left">
<xref ref-type="bibr" rid="B42">Meola and Cardani (2015)</xref>
</td>
</tr>
<tr>
<td rowspan="7" align="left">Muscular dystrophies (non-congenital)</td>
<td align="left">&#x23;13: GO:0048747 &#x2013; muscle fiber development</td>
<td rowspan="7" align="left">
<xref ref-type="bibr" rid="B37">Lovering et&#x20;al. (2005)</xref>
</td>
</tr>
<tr>
<td align="left">&#x23;13: GO:0007517 &#x2013; muscle organ development</td>
</tr>
<tr>
<td align="left">&#x23;112: GO:0007517 &#x2013; muscle organ development</td>
</tr>
<tr>
<td align="left">&#x23;112: GO:0048747 &#x2013; muscle fiber development</td>
</tr>
<tr>
<td align="left">&#x23;60: hsa05414 &#x2013; dilated cardiomyopathy</td>
</tr>
<tr>
<td align="left">&#x23;60: hsa05410 &#x2013; hypertrophic cardiomyopathy</td>
</tr>
<tr>
<td align="left">&#x23;60: R-HSA-390522 &#x2013; Striated Muscle Contraction</td>
</tr>
<tr>
<td colspan="4" align="left">
<italic>Mitochondrial target</italic>
</td>
</tr>
<tr>
<td align="left">Mitochondrial genome maintenance</td>
<td align="left">Mitochondrial myopathy or disease</td>
<td align="left">&#x2a;205: GO:0000002 &#x2013; mitochondrial genome maintenance</td>
<td rowspan="4" align="left">
<xref ref-type="bibr" rid="B51">Pfeffer and Chinnery (2013)</xref>
</td>
</tr>
<tr>
<td rowspan="3" align="left">Mitochondrial inheritance</td>
<td rowspan="3" align="left">Mitochondrial myopathy or disease</td>
<td align="left">&#x2a;48: GO:0006119 &#x2013; oxidative phosphorylation</td>
</tr>
<tr>
<td align="left">&#x2a;48: GO:0022900 &#x2013; electron transport chain</td>
</tr>
<tr>
<td align="left">&#x2a;48: GO:0045333 &#x2013; cellular respiration</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn4">
<label>
<sup>a</sup>
</label>
<p>&#x201c;&#x2a;&#x201d; tag for OMIM clusters. &#x201c;&#x23;&#x201d; tag for Orphanet clusters.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3-7">
<title>3.7 Clinical Application II: Unexpected Phenotypic Relationships in NMDs</title>
<p>Other clusters provided by <italic>PhenoClusters</italic> contained more unusual groupings of phenotypes. Clinicians were surprised by the presence of &#x2018;macroglossia&#x2019; (HP:0000158) and &#x2018;arthogryposis&#x2019; (HP:0002804) (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>). Macroglossia is usually associated with non-neuromuscular syndromes and in metabolic disorders such as glycogen storage disease type II (Pompe disease), mucopolysaccharidosis, oligosaccharidosis, mucolipidoses, sphingolipidoses and galactosidosis. However, macroglossia appeared as a hub node in the cluster &#x2a;58 (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>), strongly associated with highly representative NMD phenotypes, such as &#x2018;congenital muscular dystrophy&#x2019; and &#x2018;achilles tendon contracture&#x2019;. This phenotype also appears in clusters &#x2a;26, and &#x2a;53, with macroglossia occupying a peripheral position (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>). In macroglossia-containing clusters, 70%&#x2013;80% of phenotypes show significant enrichment for the &#x201c;protein <italic>O</italic>-linked mannosylation&#x201d; biological process (GO:0035269), suggesting that the clinical observation of macroglossia in patients with NMDs may prompt practitioners to ask for <italic>O</italic>-linked mannosylation tests. This contrasts with cluster &#x2a;211 (<xref ref-type="sec" rid="s9">Supplementary Material S1</xref>) that also contains congenital muscular dystrophy and ankle flexion contracture, as well as &#x2018;increased endomysial connective tissue&#x2019;, but not macroglossia, the functions for this cluster being &#x2018;focal adhesion&#x2019; (hsa04510) and &#x2018;ECM proteoglycans&#x2019; (R-HSA-3000178) but not &#x201c;protein <italic>O</italic>-linked mannosylation&#x201d;. Hence, cluster &#x2a;211 seems to be related to processes involved in physically connecting (&#x2018;focal adhesion&#x2019;) cells to the extracellular matrix (&#x2018;ECM proteoglycans&#x2019;). Therefore, functionally related clusters may help to discriminate disorders presenting with the macroglossia phenotype from other muscular dystrophies caused by the disruption of other cell functions. This finding shows the potential clinical utility of our approach to identify phenotypes whose presence alongside a given set of other phenotypes can indicate distinct underlying processes, with implications for diagnosis and treatment.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Example clusters including the unexpected but key macroglossia (HP:0000158) and arthrogryposis multiplex congenita (HP:0002804) phenotypes identified in OMIM and Orphanet, respectively. These phenotypes are marked in red boxes. The relevance of these phenotypes for differential diagnosis is further described in the&#x20;text.</p>
</caption>
<graphic xlink:href="fmolb-08-635074-g003.tif"/>
</fig>
<p>&#x2018;Arthogryposis&#x2019; represents another phenotype of potential use for NMD diagnosis (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>). Arthrogryposis multiplex congenita consists of contractures in multiple body areas (<xref ref-type="bibr" rid="B1">Ambegaonkar et&#x20;al., 2011</xref>). Cluster &#x23;117 shows a range of clinical phenotypes with arthrogryposis as the central node (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>), while &#x23;59 and &#x23;88 are cases where this phenotype appears in a peripheral position. Interestingly, cluster &#x23;115 (<xref ref-type="sec" rid="s9">Supplementary Material S2</xref>) presents almost all phenotypes observed in cluster &#x23;117, except arthogryposis. Hence, it can be inferred that when arthogryposis is present, the pathways associated with the majority of phenotypes in the cluster are more specific to muscle fibre-related processes including contraction dysfunction. However, when arthogryposis is absent, the cluster phenotypes share additional pathways related to cardio-myopathies and the regulation of pseudopodium assembly, indicating a broader aetiology in the genetic systems involved. As such, the presence or absence of arthogryposis alongside other symptoms may help inform NMD diagnosis and treatment, by indicating distinct underlying processes.</p>
</sec>
<sec id="s3-8">
<title>3.8 Research and Clinical Application: Clarifying Gene Involvement</title>
<p>The genes underlying the enriched functions were further investigated. It was noted that some of them occur in multiple clusters but are linked to different functions depending on the affected phenotypes. For example, <italic>DAG1</italic> is a pivotal component of the dystrophin-glycoprotein complex and its dysfunction is related to many muscular dystrophies, amongst other diseases (<xref ref-type="bibr" rid="B17">Durbeej et&#x20;al., 1998</xref>; <xref ref-type="bibr" rid="B60">Sciandra et&#x20;al., 2003</xref>). It can be considered a pleiotropic gene due to its role in glycosylation, a process which is involved in myriad cellular functions. For NMDs, it seems that glycosylation pathways are affected when <italic>DAG1</italic> appears in clusters &#x2a;1, &#x23;29 and &#x23;113, in agreement with previous studies (<xref ref-type="bibr" rid="B4">Barresi and Campbell, 2006</xref>). However, the involvement of <italic>DAG1</italic> in clusters &#x2a;198, &#x23;2, &#x23;144, &#x23;112, &#x23;103, &#x23;118, &#x23;11, &#x23;89 and &#x23;63 (<xref ref-type="sec" rid="s9">Supplementary Material S1, S2</xref>), appears to be related to cardiomyopathy (<xref ref-type="bibr" rid="B44">Michele et&#x20;al., 2009</xref>), while it is more focused on &#x2018;ECM proteoglycan components&#x2019; in cluster &#x2a;211. Hence, depending on the cluster in which <italic>DAG1</italic> appears, it seems to be involved in different pathways and functions, showing how <italic>PhenoClusters</italic> facilitates the identification of genes with multiple putative roles in NMDs depending on context.</p>
<p>Other clusters suggest that members of the solute carrier (SLC) family can perform many roles within NMDs. SLCs mediate the transport of a wide range of essential nutrients and metabolites, performing many different functions in cells and tissues (<xref ref-type="bibr" rid="B80">Zhang et&#x20;al., 2019</xref>). SLC proteins were found to be associated with nutrient supply in cluster &#x23;93; metabolic transformation in clusters &#x2a;85, &#x2a;128, and &#x2a;218; energy homeostasis in cluster &#x2a;138; oxidative stress in cluster &#x2a;205; and neurological regulation in clusters &#x2a;97 and &#x2a;166. These findings show how the phenotypic components of the functionally coherent clusters defined using <italic>PhenoClusters</italic> can point to the disruption of different cell functions in relation to NMDs involving genes from the SLC protein family.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<sec id="s4-1">
<title>4.1 PhenoClusters Generates Reproducible Results and can be Extended to Other Diseases</title>
<p>As the use of bioinformatics analysis becomes more routine within biomedicine, it is crucial that published studies are accompanied by workflows that allow the analysis to be recorded and reported in a reproducible manner that can be applied to similar datasets, if applicable. <italic>PhenoClusters</italic> is based on phenotype co-occurrence, incorporating randomisation using matched non-NMD phenotypes to generate control datasets and including literature co-mention for validation of the approach. It also uses known NMD-causing genes to provide functional support to the co-occurring phenotypes. It produces a HTML report that can be easily interpreted, following the proposed Reproducible Research System (<xref ref-type="bibr" rid="B43">Mesirov, 2010</xref>; <xref ref-type="bibr" rid="B52">Piccolo and Frampton, 2016</xref>). Although there are many articles in the bioinformatics and systems biology fields presenting modular software tools and packages, in many cases code and data are not provided, despite the importance of reproducible research in health sciences (<xref ref-type="bibr" rid="B22">Harris et&#x20;al., 2018</xref>). As it is essential for the present study, the necessary code to conduct the workflow as described in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref> has been provided in full. Since the analysis starts by downloading diseases from OMIM and Orphanet, it can be adapted to study phenotype/gene/function co-occurrences in other diseases. <italic>PhenoClusters</italic> is thus an example of the re-analysis of previously published data using a new approach that produces new results and confirms already known facts. As such, it has achieved the goals of reproducible research (<xref ref-type="bibr" rid="B43">Mesirov, 2010</xref>; <xref ref-type="bibr" rid="B52">Piccolo and Frampton, 2016</xref>) in the health sciences (<xref ref-type="bibr" rid="B22">Harris et&#x20;al., 2018</xref>) and exploiting already published results (<xref ref-type="bibr" rid="B34">Kovalevskaya et&#x20;al., 2016</xref>).</p>
</sec>
<sec id="s4-2">
<title>4.2 Network Analyses Should Rely on More Than One Database</title>
<p>
<italic>PhenoClusters</italic> did not mix data from OMIM and Orphanet based on two main facts. The first one is that OMIM and Orphanet are populated in different ways. For example, the variability of the phenotypic series of OMIM was high, with PS253600 (muscular dystrophy, limb-girdle, autosomal recessive) presenting 28 entries, while PS118220 (Charcot-Marie-Tooth disease) has 70 entries. The second one is that OMIM was searched with somewhat arbitrary keywords, whilst Orphanet NMDs were obtained based on its ontology structure. As a result, there are more OMIM-specific phenotypes and less Orphanet-specific phenotypes (<xref ref-type="fig" rid="F2">Figure&#x20;2</xref>), and fewer functionally coherent clusters in OMIM than in Orphanet (<xref ref-type="table" rid="T6">Table&#x20;6</xref>). Besides these discrepancies, both databases rendered a similar ratio of shared phenotype pairs (<xref ref-type="table" rid="T3">Table&#x20;3</xref>) and the same top specific phenotype for NMDs, &#x2018;elevated serum creatine kinase&#x2019; (<xref ref-type="sec" rid="s9">Supplementary Material S5</xref>), in agreement with the importance of the creatine kinase test often used in NMD diagnosis (<xref ref-type="bibr" rid="B70">Thavorntanaburt et&#x20;al., 2018</xref>). Other common phenotypes include muscle weakness, contractures, altered gait, functional difficulties, and respiratory issues, in agreement with recognised phenotypes for these diseases (<xref ref-type="bibr" rid="B48">Norwood et&#x20;al., 2009</xref>). However, the interesting phenotypes &#x2018;macroglossia&#x2019; and &#x2018;arthogryposis&#x2019; (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>) emerged from database-specific group of phenotypes. In any case, despite the mentioned discrepancies, it is striking that, when the phenotypes were associated with genes and functions, there was high overlap (<xref ref-type="table" rid="T4">Table&#x20;4</xref>, <xref ref-type="sec" rid="s9">Supplementary Material S6</xref>). Therefore, we believe it is preferable to use the information from OMIM and Orphanet separately and to compare to contrast the results.</p>
<p>Co-mention validation in <xref ref-type="table" rid="T5">Table&#x20;5</xref> revealed that even though GO contains many terms to describe biological functions and Reactome contains more pathway descriptions than KEGG, 2-fold more phenotype-KEGG pathway pairs (percentage-wise) were validated by literature co-mention. Moreover, when comparing functional annotation between OMIM and Orphanet, a proportionally larger overlap was found between the two resources for KEGG pathways (<xref ref-type="sec" rid="s9">Supplementary Material S6</xref>). These findings supports our previous finding that KEGG produces better bioinformatic models in genetic algorithms for clinical diagnosis and prognosis (<xref ref-type="bibr" rid="B38">Luque-Baena et&#x20;al., 2014</xref>), as well as for the outcome of diseases (<xref ref-type="bibr" rid="B73">Urda et&#x20;al., 2018</xref>). Hence, KEGG pathways should always be considered in functional analyses.</p>
</sec>
<sec id="s4-3">
<title>4.3&#x20;Co-Occurrences and Associations Appear Consistent</title>
<p>Due to the etiological heterogeneity of NMDs, each disease is defined by its own set of clinical phenotypes. Phenotypes serve to understand life and disease, but it is not always easy to translate them to molecular mechanisms and vice versa (<xref ref-type="bibr" rid="B79">Yu et&#x20;al., 2016</xref>). Taking advantage of the huge amount of data available in databases, bipartite networks (phenotype-disease, disease-gene) have been used in biomedicine to model factors that influence human diseases, explore their molecular complexity, reveal novel molecular relationships and disease susceptibility genes, uncover the biological significance of disease-associated mutations (<xref ref-type="bibr" rid="B50">Pavlopoulos et&#x20;al., 2018</xref>) and, more recently, discover phenotype/disease clusters that can predict protein-phenotype associations and reveal the underlying mechanisms that link them (<xref ref-type="bibr" rid="B53">Ren et&#x20;al., 2020</xref>). Bipartite gene-disease network analysis was revolutionised with the diseasome and related studies (<xref ref-type="bibr" rid="B19">Goh et&#x20;al., 2007</xref>) which showed that genes associated with similar disease phenotypes have a higher propensity to interact physically with each other, forming distinct disease-specific functional modules, and that disorders tend to form clusters on the basis of similar pathophysiology (<xref ref-type="bibr" rid="B49">Oti and Brunner, 2007</xref>). Other studies revealed that phenotypes and gene co-regulation accurately predict unknown disease-gene relations (<xref ref-type="bibr" rid="B14">Deelen et&#x20;al., 2019</xref>) since genes causing a specific disease or disease symptom often have similar molecular functions or are involved in the same biological process or pathway.</p>
<p>With all these facts in mind, the systems biology approach implemented in <italic>PhenoClusters</italic> lies in bipartite and tripartite networks (Modules B and C in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>) to extract co-occurring phenotypes in NMDs (<xref ref-type="sec" rid="s9">Supplementary Material S3, S4</xref>) that were consistent with i) clinical histories (<xref ref-type="bibr" rid="B48">Norwood et&#x20;al., 2009</xref>) (<xref ref-type="table" rid="T7">Table&#x20;7</xref>), ii) creatine kinase tests (<xref ref-type="bibr" rid="B45">Moghadam-Kia et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B70">Thavorntanaburt et&#x20;al., 2018</xref>) (<xref ref-type="sec" rid="s9">Supplementary Material S5</xref>), iii) proximal or distal muscular weakness (<xref ref-type="bibr" rid="B41">McDonald, 2012</xref>; <xref ref-type="bibr" rid="B47">Mukherjee et&#x20;al., 2019</xref>), and iv) postural instability and joint contracture (<xref ref-type="bibr" rid="B33">Kornegay et&#x20;al., 2012</xref>), as usually found in the clinical history of NMD patients. The genes significantly associated with NMDs by <italic>PhenoClusters</italic> were largely expressed in neuronal and/or muscle-related tissues. For those that were not, it is tempting to speculate that this is due to incomplete information in The Human Protein Atlas, however it may also indicate genes involved in development or other regulatory processes that lead to the manifestation of the NMD phenotypes. There is currently much interest in the relationship between tissue/cell-type specificity and disease progression (<xref ref-type="bibr" rid="B23">Hekselman and Yeger-Lotem, 2020</xref>). Functional enrichment of the NMD-associated genes was used to provide phenotype-function associations that were then combined with the co-occurrent phenotype communities to produce functionally coherent clusters. Gene-to-function translation reduced the degrees of freedom of the analysis (several genes were required to assign a significantly enriched function to a phenotype), increasing statistical power and allowing the detection of shared functions between phenotypes, even if the underlying genes differ. The comparison of NMD-specific associations with randomised data in <xref ref-type="table" rid="T3">Tables 3</xref>, <xref ref-type="table" rid="T4">4</xref>, <xref ref-type="table" rid="T6">6</xref> demonstrates that the findings were well-founded, as discussed&#x20;below.</p>
</sec>
<sec id="s4-4">
<title>4.4&#x20;Co-Mention in Abstracts is a Valuable Approach Validation</title>
<p>There is an absence of gold-standard datasets for phenotypic relationships, particularly for rare diseases. As such, <xref ref-type="bibr" rid="B53">Ren et&#x20;al. (2020)</xref> applied systems biology methods to obtain phenotype/disease clusters to seed machine learning models to predict protein-phenotype associations without any objective validation, assuming that they were relevant since authors can find biological support for some of the clusters. Here, abstract co-mention was proposed as a source of external validation for phenotype-phenotype and phenotype-function pairing approach. There were far fewer co-mentions for randomly paired terms than for specific pairs (<xref ref-type="table" rid="T5">Table&#x20;5</xref>), even though only a small fraction of phenotype-phenotype and phenotype-function pairs (<inline-formula id="inf35">
<mml:math id="m35">
<mml:mrow>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>10</mml:mn>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>%</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> in the second) showed significant co-mention in the literature. This is likely due to a combination of the following reasons: 1) term relationship existed, although not yet described in literature; 2) the co-mention appeared in the main body, but not in abstracts, of articles; 3) phenotypes were co-mentioned with genes rather than functions; and 4) abstract co-mention existed, but using slightly different terms or natural language synonyms that escape the search. In any case, these issues also apply to the randomised/non-NMD associations. In conclusion, although the abstract co-mention is not perfect, the fact that the amount of significant literature co-mention was much higher for NMD-specific pairs than controls (<xref ref-type="table" rid="T5">Table&#x20;5</xref>) shows it to provide suitable validation of the described approach and that real relationships were&#x20;found.</p>
</sec>
<sec id="s4-5">
<title>4.5 Functionally Related Clusters Provide Insight Into NMDs</title>
<p>Many <italic>PhenoClusters</italic> clusters are in clear agreement with current medical knowledge about the relationships between phenotype comorbidity, NMDs, their pathophysiology and genetic causes (<xref ref-type="table" rid="T7">Table&#x20;7</xref>). This serves to further support the bioinformatic approach presented here. Regarding differential diagnosis and treatment, the clusters for which the presence/absence of a specific phenotype (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>) could change the nature of the associated functions are particularly interesting: these have potential applications for differential diagnosis and treatment selection. As such, &#x2018;macroglossia&#x2019; can be used to identify <italic>O</italic>-mannosylation alterations in a given NMD dysfunction (<xref ref-type="bibr" rid="B67">Spence et&#x20;al., 2002</xref>; <xref ref-type="bibr" rid="B39">Martin, 2007</xref>; <xref ref-type="bibr" rid="B46">Moore and Winder, 2010</xref>; <xref ref-type="bibr" rid="B16">Dobson et&#x20;al., 2013</xref>; <xref ref-type="bibr" rid="B20">Goody et&#x20;al., 2015</xref>), while &#x2018;arthogryposis&#x2019; (<xref ref-type="bibr" rid="B1">Ambegaonkar et&#x20;al., 2011</xref>) may facilitate NMD diagnosis in other situations, as its presence may indicates that the disease is more specific to muscle fibres and contraction dysfunction.</p>
<p>The advantages of using functions rather than genes only is particularly evident in the findings related to pleiotropic genes and gene families involved in multiple functions. <italic>DAG1</italic> is involved in many diseases because it participates in glycosylation, whose malfunction affects many cellular processes and can produce several NMDs (<xref ref-type="bibr" rid="B17">Durbeej et&#x20;al., 1998</xref>; <xref ref-type="bibr" rid="B60">Sciandra et&#x20;al., 2003</xref>). However, its specific involvement in the proteoglycan components of the ECM seems to be related to cardiomyopathy. Additionally, despite the clear relevance to health and disease of the 190 different SLCs found mutated in human diseases, it is considered an understudied family (<xref ref-type="bibr" rid="B13">C&#xe9;sar-Razquin et&#x20;al., 2015</xref>). Functionally related clusters from <italic>PhenoClusters</italic> reveal which particular role can be putatively assigned to the present members of the SLC family. Taken together, these results encourage future research lines directed to systematically exploit co-occurrence and clusters of co-occurrent phenotypes and functions in other diseases, as well as further study of a number of presented clusters to obtain more details on the functional implications.</p>
</sec>
<sec id="s4-6">
<title>4.6 Clinical Implications of Clusters</title>
<p>It has been shown that functionally coherent clusters have potential utility in NMDs in terms of better understanding clinical presentation in these diseases and obtaining clues as to the underlying molecular genetic mechanisms. The former has important implications for diagnosis and patient classification; the latter will help researchers better understand these diseases and search for potential new therapeutic targets.</p>
<p>Their potential for diagnosis is clear: given a patient that presents a number of phenotypes corresponding to one of the clusters, one can make inferences about other clinical phenotypes that the patient may also suffer and that should be tested for. This will help obtain a better clinical profile for the patient, aiding diagnosis. Moreover, genes and functional terms associated with the same cluster can be of use for guiding genetic diagnosis and indicate further pathological examination. For example, multiple clusters in the peripheral neuropathy group in <xref ref-type="table" rid="T7">Table&#x20;7</xref> contain phenotypes associated with myelination and axon ensheathment related genes (<xref ref-type="bibr" rid="B83">Zhou and Notterpek, 2016</xref>; <xref ref-type="bibr" rid="B30">Kamil et&#x20;al., 2019</xref>). As such, given a patient showing phenotypes belonging to one of these clusters, but for whom full diagnosis has not yet been achieved, the clinician could refer the patient for the appropriate assays, such as MRI, to look for demyelination and guide genetic studies to focus on related&#x20;genes.</p>
<p>A further clinical application is related to differential diagnosis based on the phenotypic profile presented by a patient. The presence/absence of phenotypes &#x2018;macroglossia&#x2019; and &#x2018;arthogryposis&#x2019; (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>) has been thoroughly explained as examples of phenotypes indicating differing underlying mechanisms that lead to disease manifestation. However, many other examples undoubtedly exist among the clusters presented in <xref ref-type="sec" rid="s9">Supplementary Material S1,&#x20;S2</xref>.</p>
<p>Nevertheless, there are several limitations in our bioinformatic approach, largely related to the external databases from which the information is acquired. OMIM and Orphanet are both incomplete resources: there are undoubtedly multiple diseases suffered by people around the world whose description and genetic basis have not made their way into these databases. This means that we are likely to miss co-occurrent phenotypes as the diseases in which they co-occur have not yet been added. Similarly, the resources used for functional enrichment analysis, used to ascribe function to the NMD phenotypes in this study, are also incomplete. We do not yet know the function of all genes in the genome, and this has effects on the enrichment procedures. As these resources improve, the potential of our workflow to find clusters of co-occurrent phenotypes and fully characterise their underlying basis will no doubt improve with them. However, regarding the information of clusters, this approach can only extract functions from genes known to be involved in NMDs, and cannot hypothesise about other genes even if they are working in the same pathway. And as already mentioned above, there is a limitation concerning literature co-mention validation (<xref ref-type="table" rid="T5">Table&#x20;5</xref>), as a higher proportion of confirmed pairs it would be desirable.</p>
<p>In conclusion, our approach and the resultant functionally coherent clusters of NMD phenotypes (<xref ref-type="sec" rid="s9">Supplementary Material S1, S2</xref>) can 1) relate phenotype co-occurrence across NMDs to the underlying genes and mechanisms involved in the NMD (or other diseases); 2) provide clinicians with hints about clinical tests to produce a more reliable diagnosis based on the presence or absence of some specific phenotypes that have not yet been reported by the patient or the clinician, in the comorbidity context of the patient; 3) give researchers clues to perform new experiments to discover the underlying biological mechanisms of a disease; and 4) help in selecting optimal treatment. Therefore, <italic>PhenoClusters</italic> can be considered a new tool for more accurate diagnosis and an advance towards personalised medicine for&#x20;NMDs.</p>
</sec>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s9">Supplementary Material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>ED-S conducted the formal analysis and investigation, produces the resources and software, as well as validation and visualisations. MC structured the work, improved the reports and wrote the final manuscript. RY, YD, RC, JH, and FP interpreted the functionally coherent clusters and reviewed the manuscript. JR obtained the founding sources, administrates the project and conceptualised the analysis. JP performs the data curation, investigated the results, selected the methodology, produced the original draft and edited the English wording. JR and JP contributed equally to the research.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>The study was funded by grants from the Andalusian Government (Junta de Andalucia) with European Regional Development Fund UMA18-FEDERJA-102; the Ram&#xf3;n Areces foundation, which funds project for the investigation of rare disease (National call for research on life and material sciences, XIX edition); the Spanish Ministry of Science and Innovation with European Regional Development Fund PID2019-108096RB-C21; and the Ram&#xf3;n y Cajal I3 projects through the Research Plan of the University of Malaga (Ayudas del I Plan Propio).</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<ack>
<p>The CIBERER is an initiative from the Carlos III Health Institute (Instituto de Salud Carlos III; ISCIII). The authors thank the Supercomputing and Bioinnovation Center (SCBI) at the University of Malaga for their provision of computational resources and technical support (<ext-link ext-link-type="uri" xlink:href="http://www.scbi.uma.es/">http://www.scbi.uma.es/</ext-link>).</p>
</ack>
<sec id="s9">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmolb.2021.635074/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmolb.2021.635074/full&#x23;supplementary-material</ext-link>.</p>
<supplementary-material xlink:href="DataSheet1.zip" id="SM1" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<sec id="s10">
<title>Abbreviations</title>
<p>ECM, extracellular matrix; GO, gene ontology; HPO, human phenotype ontology; HyI, hypergeometric index; KEGG, kyoto encyclopedia of genes and genomes; MD, muscular dystrophy; NMD, neuromuscular disease; non-NMD, non-neuromuscular disease; OMIM, online Mendelian inheritance in man; PMID, pubMed identifier; SLC, solute carrier.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ambegaonkar</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Manzur</surname>
<given-names>A. Y.</given-names>
</name>
<name>
<surname>Robb</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Kinali</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Muntoni</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The multiple phenotypes of arthrogryposis multiplex congenita with reference to the neurogenic variant</article-title>. <source>Eur. J.&#x20;Paediatr. Neurol.</source> <volume>15</volume>, <fpage>316</fpage>&#x2013;<lpage>319</lpage>. <pub-id pub-id-type="doi">10.1016/j.ejpn.2011.01.007</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amberger</surname>
<given-names>J.&#x20;S.</given-names>
</name>
<name>
<surname>Bocchini</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Scott</surname>
<given-names>A. F.</given-names>
</name>
<name>
<surname>Hamosh</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Omim.org: leveraging knowledge across phenotype-gene relationships</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>D1038</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gky1151</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bagley</surname>
<given-names>S. C.</given-names>
</name>
<name>
<surname>Sirota</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Butte</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Altman</surname>
<given-names>R. B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Constraints on biological mechanism from disease comorbidity using electronic medical records and database of genetic variants</article-title>. <source>PLoS Comput. Biol.</source> <volume>12</volume>, <fpage>e1004885</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1004885</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barresi</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Campbell</surname>
<given-names>K. P.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Dystroglycan: from biosynthesis to pathogenesis of human disease</article-title>. <source>J.&#x20;Cell Sci.</source> <volume>119</volume>, <fpage>199</fpage>&#x2013;<lpage>207</lpage>. <pub-id pub-id-type="doi">10.1242/jcs.02814</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bass</surname>
<given-names>J.&#x20;I. F.</given-names>
</name>
<name>
<surname>Diallo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nelson</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Soto</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Myers</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Walhout</surname>
<given-names>A. J.&#x20;M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Using networks to measure similarity between genes: association index selection</article-title>. <source>Nat. Methods</source> <volume>10</volume>, <fpage>1169</fpage>&#x2013;<lpage>1176</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.2728</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>B&#xe4;umer</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Nicholson</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Davies</surname>
<given-names>J.&#x20;L.</given-names>
</name>
<name>
<surname>Parkinson</surname>
<given-names>N. J.</given-names>
</name>
<name>
<surname>Murray</surname>
<given-names>L. M.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Alternative splicing events are a late feature of pathology in a mouse model of spinal muscular atrophy</article-title>. <source>PLoS Genet.</source> <volume>5</volume>, <fpage>e1000773</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1000773</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benarroch</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bonne</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Rivier</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Hamroun</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The 2020 version of the gene table of neuromuscular disorders (nuclear genome)</article-title>. <source>Neuromuscul. Disord.</source> <volume>29</volume>, <fpage>980</fpage>. <pub-id pub-id-type="doi">10.1016/j.nmd.2019.10.010</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benjamini</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hochberg</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Controlling the false discovery rate: a practical and powerful approach to multiple testing</article-title>. <source>J.&#x20;R. Stat. Soc. Series B Stat. Methodol.</source> <volume>57</volume>, <fpage>289</fpage>&#x2013;<lpage>300</lpage>. <pub-id pub-id-type="doi">10.1111/j.2517-6161.1995.tb02031.x</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Birgmeier</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Haeussler</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Deisseroth</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Steinberg</surname>
<given-names>E. H.</given-names>
</name>
<name>
<surname>Jagadeesh</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Ratner</surname>
<given-names>A. J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>AMELIE speeds Mendelian diagnosis by matching patient phenotype and genotype to primary literature</article-title>. <source>Sci. Transl. Med.</source> <volume>12</volume>, <fpage>eaau9113</fpage>. <pub-id pub-id-type="doi">10.1126/scitranslmed.aau9113</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname>
<given-names>T. L.</given-names>
</name>
<name>
<surname>Meloche</surname>
<given-names>T. M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Exome sequencing a review of new strategies for rare genomic disease research</article-title>. <source>Genomics</source> <volume>108</volume>, <fpage>109</fpage>&#x2013;<lpage>114</lpage>. <pub-id pub-id-type="doi">10.1016/j.ygeno.2016.06.003</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bueno</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-L&#xf3;pez</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Reyes-Palomares</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rojano</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Corpas</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nevado</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Phenotype-loci associations in networks of patients with rare disorders: application to assist in the diagnosis of novel clinical cases</article-title>. <source>Eur. J.&#x20;Hum. Genet.</source> <volume>26</volume>, <fpage>1451</fpage>&#x2013;<lpage>1461</lpage>. <pub-id pub-id-type="doi">10.1038/s41431-018-0139-x</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cassandrini</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Trovato</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Rubegni</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lenzi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Fiorillo</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Baldacci</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Congenital myopathies: clinical phenotypes and new diagnostic tools</article-title>. <source>Ital. J.&#x20;Pediatr.</source> <volume>43</volume>, <fpage>101</fpage>. <pub-id pub-id-type="doi">10.1186/s13052-017-0419-z</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>C&#xe9;sar-Razquin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Snijder</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Frappier-Brinton</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Isserlin</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Gyimesi</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Bai</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>A call for systematic research on solute carriers</article-title>. <source>Cell</source> <volume>162</volume>, <fpage>478</fpage>&#x2013;<lpage>487</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2015.07.022</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deelen</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>van Dam</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Herkert</surname>
<given-names>J.&#x20;C.</given-names>
</name>
<name>
<surname>Karjalainen</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Brugge</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Abbott</surname>
<given-names>K. M.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Improving the diagnostic yield of exome- sequencing by predicting gene-phenotype associations using large-scale gene expression analysis</article-title>. <source>Nat. Commun.</source> <volume>10</volume>, <fpage>2837</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-019-10649-4</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>D&#xed;az-Santiago</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Jabato</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Rojano</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Seoane</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Pazos</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Phenotype-genotype comorbidity analysis of patients with rare disorders provides insight into their pathological and molecular bases</article-title>. <source>PLoS Genet.</source> <volume>16</volume>, <fpage>e1009054</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1009054</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dobson</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Hempel</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Stalnaker</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Stuart</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wells</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>O-mannosylation and human disease</article-title>. <source>Cell. Mol. Life Sci.</source> <volume>70</volume>, <fpage>2849</fpage>&#x2013;<lpage>2857</lpage>. <pub-id pub-id-type="doi">10.1007/s00018-012-1193-0</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Durbeej</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Henry</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Campbell</surname>
<given-names>K. P.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Dystroglycan in development and disease</article-title>. <source>Curr. Opin. Cell Biol.</source> <volume>10</volume>, <fpage>594</fpage>&#x2013;<lpage>601</lpage>. <pub-id pub-id-type="doi">10.1016/s0955-0674(98)80034-3</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Firth</surname>
<given-names>H. V.</given-names>
</name>
<name>
<surname>Richards</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Bevan</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Clayton</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Corpas</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rajan</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Decipher: database of chromosomal imbalance and phenotype in humans using ensembl resources</article-title>. <source>Am. J.&#x20;Hum. Genet.</source> <volume>84</volume>, <fpage>524</fpage>&#x2013;<lpage>533</lpage>. <pub-id pub-id-type="doi">10.1016/j.ajhg.2009.03.010</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goh</surname>
<given-names>K.-I.</given-names>
</name>
<name>
<surname>Cusick</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Valle</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Childs</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Vidal</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Barab&#xe1;si</surname>
<given-names>A.-L.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>The human disease network</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>104</volume>, <fpage>8685</fpage>&#x2013;<lpage>8690</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0701361104</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goody</surname>
<given-names>M. F.</given-names>
</name>
<name>
<surname>Sher</surname>
<given-names>R. B.</given-names>
</name>
<name>
<surname>Henry</surname>
<given-names>C. A.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Hanging on for the ride: adhesion to the extracellular matrix mediates cellular responses in skeletal muscle morphogenesis and disease</article-title>. <source>Dev. Biol.</source> <volume>401</volume>, <fpage>75</fpage>&#x2013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.1016/j.ydbio.2015.01.002</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hamosh</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Online Mendelian inheritance in man (OMIM), a knowledgebase of human genes and genetic disorders</article-title>. <source>Nucleic Acids Res.</source> <volume>33</volume>, <fpage>D514</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gki033</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Harris</surname>
<given-names>J.&#x20;K.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>K. J.</given-names>
</name>
<name>
<surname>Carothers</surname>
<given-names>B. J.</given-names>
</name>
<name>
<surname>Combs</surname>
<given-names>T. B.</given-names>
</name>
<name>
<surname>Luke</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Use of reproducible research practices in public health: a survey of public health analysts</article-title>. <source>PLoS One</source> <volume>13</volume>, <fpage>e0202447</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0202447</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hekselman</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Yeger-Lotem</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Mechanisms of tissue and cell-type specificity in heritable traits and diseases</article-title>. <source>Nat. Rev. Genet.</source> <volume>21</volume>, <fpage>137</fpage>&#x2013;<lpage>150</lpage>. <pub-id pub-id-type="doi">10.1038/s41576-019-0200-9</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hidalgo</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Blumm</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Barab&#xe1;si</surname>
<given-names>A.-L.</given-names>
</name>
<name>
<surname>Christakis</surname>
<given-names>N. A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>A dynamic network approach for the study of human phenotypes</article-title>. <source>PLoS Comput. Biol.</source> <volume>5</volume>, <fpage>e1000353</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1000353</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoehndorf</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Schofield</surname>
<given-names>P. N.</given-names>
</name>
<name>
<surname>Gkoutos</surname>
<given-names>G. V.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>The role of ontologies in biological and biomedical research: a functional perspective</article-title>. <source>Brief. Bioinform.</source> <volume>16</volume>, <fpage>1069</fpage>&#x2013;<lpage>1080</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbv011</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huber</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Carey</surname>
<given-names>V. J.</given-names>
</name>
<name>
<surname>Gentleman</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Anders</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Carlson</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Carvalho</surname>
<given-names>B. S.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Orchestrating high-throughput genomic analysis with bioconductor</article-title>. <source>Nat. Methods</source> <volume>12</volume>, <fpage>115</fpage>&#x2013;<lpage>121</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.3252</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hwang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Atluri</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dey</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Co-clustering phenome-genome for phenotype classification and disease gene discovery</article-title>. <source>Nucleic Acids Res.</source> <volume>40</volume>, <fpage>e146</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gks615</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jabato</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Seoane</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<name>
<surname>Rojano</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Garc&#xed;a Moreno</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chagoyen</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Systematic identification of genetic systems associated with phenotypes in patients with rare genomic copy number variations</article-title>. <source>Hum. Genet.</source> <volume>140</volume>, <fpage>457</fpage>. <pub-id pub-id-type="doi">10.1007/s00439-020-02214-7</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kalinka</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Tomancak</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Linkcomm: an R package for the generation, visualization, and analysis of link communities in networks of arbitrary size and type</article-title>. <source>Bioinformatics</source> <volume>27</volume>, <fpage>2011</fpage>&#x2013;<lpage>2012</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr311</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kamil</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Yazid</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Idrus</surname>
<given-names>R. B. H.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Peripheral demyelinating diseases: from biology to translational medicine</article-title>. <source>Front. Neurol.</source> <volume>10</volume>, <fpage>87</fpage>. <pub-id pub-id-type="doi">10.3389/fneur.2019.00087</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>K&#xf6;hler</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gargano</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Matentzoglu</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Carmody</surname>
<given-names>L. C.</given-names>
</name>
<name>
<surname>Lewis-Smith</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Vasilevsky</surname>
<given-names>N. A.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>The human phenotype ontology in 2021</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>D1207</fpage>&#x2013;<lpage>D1217</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa1043</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>K&#xf6;hler</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Schulz</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Krawitz</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Bauer</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>D&#xf6;lken</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ott</surname>
<given-names>C. E.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Clinical diagnostics in human genetics with semantic similarity searches in ontologies</article-title>. <source>Am. J.&#x20;Hum. Genet.</source> <volume>85</volume>, <fpage>457</fpage>. <pub-id pub-id-type="doi">10.1016/j.ajhg.2009.09.003</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kornegay</surname>
<given-names>J.&#x20;N.</given-names>
</name>
<name>
<surname>Childers</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Bogan</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Bogan</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<name>
<surname>Nghiem</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>The paradox of muscle hypertrophy in muscular dystrophy</article-title>. <source>Phys. Med. Rehabil. Clin. N. Am.</source> <volume>23</volume>, <fpage>149</fpage>&#x2013;<lpage>172</lpage>. <pub-id pub-id-type="doi">10.1016/j.pmr.2011.11.014</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kovalevskaya</surname>
<given-names>N. V.</given-names>
</name>
<name>
<surname>Whicher</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Richardson</surname>
<given-names>T. D.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Grajciarova</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cardama</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Dnadigest and repositive: connecting the world of genomic data</article-title>. <source>PLoS Biol.</source> <volume>14</volume>, <fpage>e1002418</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pbio.1002418</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kraker</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zivkovi&#x107;</surname>
<given-names>S. A.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Autoimmune neuromuscular disorders</article-title>. <source>Curr. Neuropharmacol.</source> <volume>9</volume>, <fpage>400</fpage>&#x2013;<lpage>408</lpage>. <pub-id pub-id-type="doi">10.2174/157015911796558000</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Laing</surname>
<given-names>N. G.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Genetics of neuromuscular disorders</article-title>. <source>Crit. Rev. Clin. Lab. Sci.</source> <volume>49</volume>, <fpage>33</fpage>&#x2013;<lpage>48</lpage>. <pub-id pub-id-type="doi">10.3109/10408363.2012.658906</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lovering</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Porter</surname>
<given-names>N. C.</given-names>
</name>
<name>
<surname>Bloch</surname>
<given-names>R. J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>The muscular dystrophies: from genes to therapies</article-title>. <source>Phys. Ther.</source> <volume>85</volume>, <fpage>1372</fpage>&#x2013;<lpage>1388</lpage>. <pub-id pub-id-type="doi">10.1093/ptj/85.12.1372</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luque-Baena</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Urda</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Gonzalo Claros</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Franco</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Jerez</surname>
<given-names>J.&#x20;M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Robust gene signatures from microarray data using genetic algorithms enriched with biological pathway keywords</article-title>. <source>J.&#x20;Biomed. Inform.</source> <volume>49</volume>, <fpage>32</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2014.01.006</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martin</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Congenital muscular dystrophies involving the o-mannose pathway</article-title>. <source>Curr. Mol. Med.</source> <volume>7</volume>, <fpage>417</fpage>&#x2013;<lpage>425</lpage>. <pub-id pub-id-type="doi">10.2174/156652407780831601</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mccormack</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Woods</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Aartsma-Rus</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hagger</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Herczegfalvi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Heslop</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Guidance in social and ethical issues related to clinical, diagnostic care and novel therapies for hereditary neuromuscular rare diseases: &#x201c;translating&#x201d; the translational</article-title>. <source>PLoS Curr.</source> <volume>5</volume>, <fpage>1</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1371/currents.md.f90b49429fa814bd26c5b22b13d773ec</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McDonald</surname>
<given-names>C. M.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Clinical approach to the diagnostic evaluation of hereditary and acquired neuromuscular diseases</article-title>. <source>Phys. Med. Rehabil. Clin. N. Am.</source> <volume>23</volume>, <fpage>495</fpage>&#x2013;<lpage>563</lpage>. <pub-id pub-id-type="doi">10.1016/j.pmr.2012.06.011</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meola</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Cardani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Myotonic dystrophies: an update on clinical aspects, genetic, pathology, and molecular pathomechanisms</article-title>. <source>Biochim. Biophys. Acta Mol. Basis Dis.</source> <volume>1852</volume>, <fpage>594</fpage>&#x2013;<lpage>606</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbadis.2014.05.019</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mesirov</surname>
<given-names>J.&#x20;P.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Computer science. accessible reproducible research</article-title>. <source>Science</source> <volume>327</volume>, <fpage>415</fpage>&#x2013;<lpage>416</lpage>. <pub-id pub-id-type="doi">10.1126/science.1179653</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Michele</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Kabaeva</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Weiss</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Campbell</surname>
<given-names>K. P.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Dystroglycan matrix receptor function in cardiac myocytes is important for limiting activity-induced myocardial damage</article-title>. <source>Circ. Res.</source> <volume>105</volume>, <fpage>984</fpage>&#x2013;<lpage>993</lpage>. <pub-id pub-id-type="doi">10.1161/CIRCRESAHA.109.199489</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moghadam-Kia</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Oddis</surname>
<given-names>C. V.</given-names>
</name>
<name>
<surname>Aggarwal</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Approach to asymptomatic creatine kinase elevation</article-title>. <source>Cleve. Clin. J.&#x20;Med.</source> <volume>83</volume>, <fpage>37</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.3949/ccjm.83a.14120</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moore</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Winder</surname>
<given-names>S. J.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Dystroglycan versatility in cell adhesion: a tale of multiple motifs</article-title>. <source>Cell Commun. Signal.</source> <volume>8</volume>, <fpage>3</fpage>. <pub-id pub-id-type="doi">10.1186/1478-811X-8-3</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mukherjee</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Dhawan</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Saini</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Muscle hypertrophy in a child with progressive weakness-thinking beyond muscular dystrophy</article-title>. <source>J.&#x20;Clin. Neuromuscul. Dis.</source> <volume>20</volume>, <fpage>140</fpage>&#x2013;<lpage>141</lpage>. <pub-id pub-id-type="doi">10.1097/CND.0000000000000227</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Norwood</surname>
<given-names>F. L. M.</given-names>
</name>
<name>
<surname>Harling</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Chinnery</surname>
<given-names>P. F.</given-names>
</name>
<name>
<surname>Eagle</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bushby</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Straub</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Prevalence of genetic muscle disease in northern England: in-depth analysis of a muscle clinic population</article-title>. <source>Brain</source> <volume>132</volume>, <fpage>3175</fpage>&#x2013;<lpage>3186</lpage>. <pub-id pub-id-type="doi">10.1093/brain/awp236</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oti</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Brunner</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>The modular nature of genetic diseases</article-title>. <source>Clin. Genet.</source> <volume>71</volume>, <fpage>1</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1111/j.1399-0004.2006.00708.x</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pavlopoulos</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Kontou</surname>
<given-names>P. I.</given-names>
</name>
<name>
<surname>Pavlopoulou</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bouyioukos</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Markou</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Bagos</surname>
<given-names>P. G.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Bipartite graphs in systems biology and medicine: a survey of methods and applications</article-title>. <source>Gigascience</source> <volume>7</volume>, <fpage>1</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1093/gigascience/giy014</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pfeffer</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Chinnery</surname>
<given-names>P. F.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Diagnosis and treatment of mitochondrial myopathies</article-title>. <source>Ann. Med.</source> <volume>45</volume>, <fpage>4</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.3109/07853890.2011.605389</pub-id> </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Piccolo</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Frampton</surname>
<given-names>M. B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Tools and techniques for computational reproducibility</article-title>. <source>Gigascience</source> <volume>5</volume>, <fpage>30</fpage>. <pub-id pub-id-type="doi">10.1186/s13742-016-0135-4</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ren</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Decipher the connections between proteins and phenotypes</article-title>. <source>Biochim. Biophys. Acta - Proteins Proteom.</source> <volume>1868</volume>, <fpage>140503</fpage>. <pub-id pub-id-type="doi">10.1016/j.bbapap.2020.140503</pub-id> </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodr&#xed;guez Cruz</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Palace</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Beeson</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>The neuromuscular junction and wide heterogeneity of congenital myasthenic syndromes</article-title>. <source>Int. J.&#x20;Mol. Sci.</source> <volume>19</volume>, <fpage>1677</fpage>. <pub-id pub-id-type="doi">10.3390/ijms19061677</pub-id> </citation>
</ref>
<ref id="B55">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Rojano</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Seoane</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Bueno-Amoros</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Perkins</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<name>
<surname>Garcia-Ranea</surname>
<given-names>J.&#x20;A.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>Revealing the relationship between human genome regions and pathological phenotypes through network analysis</article-title>,&#x201d; in <source>Lecture notes in computer science (including subseries lecture notes in artificial intelligence and lecture notes in bioinformatics)</source>, <publisher-loc>Cham, Switzerland</publisher-loc>, <fpage>197</fpage>&#x2013;<lpage>207</lpage>. </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rossoll</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Bassell</surname>
<given-names>G. J.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Spinal muscular atrophy and a model for survival of motor neuron protein function in axonal ribonucleoprotein complexes</article-title>. <source>Results Probl. Cell Differ.</source> <volume>48</volume>, <fpage>289</fpage>&#x2013;<lpage>326</lpage>. <pub-id pub-id-type="doi">10.1007/400_2009_4</pub-id> </citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roy</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Van den Bergh</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Van Damme</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Doggen</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Van Casteren</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Van Casteren</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Early stages of building a rare disease registry, methods and 2010 data from the Belgian neuromuscular disease registry (BNMDR)</article-title>. <source>Acta Neurol. Belg.</source> <volume>115</volume>, <fpage>97</fpage>&#x2013;<lpage>104</lpage>. <pub-id pub-id-type="doi">10.1007/s13760-014-0320-0</pub-id> </citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rzhetsky</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wajngurt</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Probing genetic overlap among complex human phenotypes</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>104</volume>, <fpage>11694</fpage>&#x2013;<lpage>11699</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0704820104</pub-id> </citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sarnat</surname>
<given-names>H. B.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>New insights into the pathogenesis of congenital myopathies</article-title>. <source>J.&#x20;Child Neurol.</source> <volume>9</volume>, <fpage>193</fpage>&#x2013;<lpage>201</lpage>. <pub-id pub-id-type="doi">10.1177/088307389400900218</pub-id> </citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sciandra</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Bozzi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bianchi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pavoni</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Giardina</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Brancaccio</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Dystroglycan and muscular dystrophies related to the dystrophin-glycoprotein complex</article-title>. <source>Ann. Ist. Super Sanita</source> <volume>39</volume>, <fpage>173</fpage>&#x2013;<lpage>181</lpage>. </citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scoto</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Finkel</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mercuri</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Muntoni</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Genetic therapies for inherited neuromuscular disorders</article-title>. <source>Lancet Child Adolesc. Health</source> <volume>2</volume>, <fpage>600</fpage>&#x2013;<lpage>609</lpage>. <pub-id pub-id-type="doi">10.1016/S2352-4642(18)30140-8</pub-id> </citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scotton</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Passarelli</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Neri</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ferlini</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Biomarkers in rare neuromuscular diseases</article-title>. <source>Exp. Cell Res.</source> <volume>325</volume>, <fpage>44</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1016/j.yexcr.2013.12.020</pub-id> </citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seoane</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Oca&#xf1;a</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Carmona</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bautista</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Madrid</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Torres</surname>
<given-names>A. M.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>AutoFlow, a versatile workflow engine illustrated by assembling an optimised <italic>de novo</italic> transcriptome for a non-model species, such as faba bean (<italic>Vicia faba</italic>)</article-title>. <source>Curr. Bioinform.</source> <volume>11</volume>, <fpage>1</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.2174/1574893611666160212235117</pub-id> </citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singleton</surname>
<given-names>M. V.</given-names>
</name>
<name>
<surname>Guthery</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Voelkerding</surname>
<given-names>K. V.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kennedy</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Margraf</surname>
<given-names>R. L.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Phevor combines multiple biomedical ontologies for accurate identification of disease-causing alleles in single individuals and small nuclear families</article-title>. <source>Am. J.&#x20;Hum. Genet.</source> <volume>94</volume>, <fpage>599</fpage>&#x2013;<lpage>610</lpage>. <pub-id pub-id-type="doi">10.1016/j.ajhg.2014.03.010</pub-id> </citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sirota</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Schaub</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Batzoglou</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Robinson</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Butte</surname>
<given-names>A. J.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Autoimmune disease classification by inverse association with SNP alleles</article-title>. <source>PLoS Genet.</source> <volume>5</volume>, <fpage>e1000792</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1000792</pub-id> </citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Souza</surname>
<given-names>P. V. S. d.</given-names>
</name>
<name>
<surname>Batistella</surname>
<given-names>G. N. d. R.</given-names>
</name>
<name>
<surname>Lino</surname>
<given-names>V. C.</given-names>
</name>
<name>
<surname>Pinto</surname>
<given-names>W. B. V. d. R.</given-names>
</name>
<name>
<surname>Annes</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Oliveira</surname>
<given-names>A. S. B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Clinical and genetic basis of congenital myasthenic syndromes</article-title>. <source>Arq. Neuro-Psiquiatr.</source> <volume>74</volume>, <fpage>750</fpage>&#x2013;<lpage>760</lpage>. <pub-id pub-id-type="doi">10.1590/0004-282X20160106</pub-id> </citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spence</surname>
<given-names>H. J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.-J.</given-names>
</name>
<name>
<surname>Winder</surname>
<given-names>S. J.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Muscular dystrophies, the cytoskeleton and cell adhesion</article-title>. <source>Bioessays</source> <volume>24</volume>, <fpage>542</fpage>&#x2013;<lpage>552</lpage>. <pub-id pub-id-type="doi">10.1002/bies.10098</pub-id> </citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spuler</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Stroux</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kuschel</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Kuhlmey</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kendel</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Delay in diagnosis of muscle disorders depends on the subspecialty of the initially consulted physician</article-title>. <source>BMC Health Serv. Res.</source> <volume>11</volume>, <fpage>91</fpage>. <pub-id pub-id-type="doi">10.1186/1472-6963-11-91</pub-id> </citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tan</surname>
<given-names>N. B.</given-names>
</name>
<name>
<surname>Stapleton</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Stark</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Delatycki</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Yeung</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hunter</surname>
<given-names>M. F.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Evaluating systematic reanalysis of clinical genomic data in rare disease from single center experience and literature review</article-title>. <source>Mol. Genet. Genomic Med.</source> <volume>8</volume>, <fpage>e1508</fpage>. <pub-id pub-id-type="doi">10.1002/mgg3.1508</pub-id> </citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thavorntanaburt</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tanboon</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Likasitwattanakul</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sangruchi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Nishino</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Ngerncham</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Impact of muscle biopsy on diagnosis and management of children with neuromuscular diseases: a 10-year retrospective critical review</article-title>. <source>J.&#x20;Pediatr. Surg.</source> <volume>53</volume>, <fpage>489</fpage>&#x2013;<lpage>492</lpage>. <pub-id pub-id-type="doi">10.1016/j.jpedsurg.2017.06.006</pub-id> </citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Turakhia</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Barrick</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Berman</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Patients with neuromuscular disorder</article-title>. <source>Med. Clin. N. Am.</source> <volume>97</volume>, <fpage>1015</fpage>&#x2013;<lpage>1032</lpage>. <pub-id pub-id-type="doi">10.1016/j.mcna.2013.05.005</pub-id> </citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Uhl&#xe9;n</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fagerberg</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Hallstr&#xf6;m</surname>
<given-names>B. M.</given-names>
</name>
<name>
<surname>Lindskog</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Oksvold</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Mardinoglu</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Tissue-based map of the human proteome</article-title>. <source>Science</source> <volume>347</volume>, <fpage>1260419</fpage>. <pub-id pub-id-type="doi">10.1126/science.1260419</pub-id> </citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Urda</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Arag&#xf3;n</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Bautista</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Franco</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Veredas</surname>
<given-names>F. J.</given-names>
</name>
<name>
<surname>Claros</surname>
<given-names>M. G.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Blasso: integration of biological knowledge into a regularized linear model</article-title>. <source>BMC Syst. Biol.</source> <volume>12</volume>, <fpage>94</fpage>. <pub-id pub-id-type="doi">10.1186/s12918-018-0612-8</pub-id> </citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vasant</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chanas</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Malone</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hanauer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Olry</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Jupp</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Ordo: an ontology connecting rare disease, epidemiology and genetic data</article-title>. <source>Phenotype data at ISMB2014</source>, <fpage>1</fpage>&#x2013;<lpage>4</lpage>. <comment>Available at <ext-link ext-link-type="uri" xlink:href="https://www.researchgate.net/profile/Drashtti-Vasant/publication/281824026_ORDO_An_Ontology_Connecting_Rare_Disease_Epidemiology_and_Genetic_Data/links/55f99bc408aeafc8ac266edf/ORDO-An-Ontology-Connecting-Rare-Disease-Epidemiology-and-Genetic-Data.pdf">https://www.researchgate.net/profile/Drashtti-Vasant/publication/281824026_ORDO_An_Ontology_Connecting_Rare_Disease_Epidemiology_and_Genetic_Data/links/55f99bc408aeafc8ac266edf/ORDO-An-Ontology-Connecting-Rare-Disease-Epidemiology-and-Genetic-Data.pdf</ext-link>
</comment> </citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Robinson</surname>
<given-names>P. N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Phenolyzer: phenotype-based prioritization of candidate genes for human diseases</article-title>. <source>Nat. Methods</source> <volume>12</volume>, <fpage>841</fpage>&#x2013;<lpage>843</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.3484</pub-id> </citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kwoh</surname>
<given-names>C.-K.</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>S.-K.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Inferring gene-phenotype associations via global protein complex network propagation</article-title>. <source>PLoS One</source> <volume>6</volume>, <fpage>e21502</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0021502</pub-id> </citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>Q.-Y.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>ReactomePA: an R/Bioconductor package for reactome pathway analysis and visualization</article-title>. <source>Mol. Biosyst.</source> <volume>12</volume>, <fpage>477</fpage>&#x2013;<lpage>479</lpage>. <pub-id pub-id-type="doi">10.1039/c5mb00663e</pub-id> </citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.-G.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>Q.-Y.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>ClusterProfiler: an R package for comparing biological themes among gene clusters</article-title>. <source>OMICS: A J.&#x20;Integr. Biol.</source> <volume>16</volume>, <fpage>284</fpage>&#x2013;<lpage>287</lpage>. <pub-id pub-id-type="doi">10.1089/omi.2011.0118</pub-id> </citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Kramer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dutkowski</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Srivas</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Licon</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kreisberg</surname>
<given-names>J.&#x20;F.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Translation of genotype to phenotype by a hierarchy of cell subsystems</article-title>. <source>Cell Syst.</source> <volume>2</volume>, <fpage>77</fpage>&#x2013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.1016/j.cels.2016.02.003</pub-id> </citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The slc transporter in nutrient and metabolic sensing, regulation, and drug development</article-title>. <source>J.&#x20;Mol. Cell Biol.</source> <volume>11</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1093/jmcb/mjy052</pub-id> </citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Havrilla</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Phen2Gene: rapid phenotype-driven gene prioritization for rare diseases</article-title>. <source>NAR Genomics and Bioinformatics</source> <volume>2</volume>, <fpage>lqaa032</fpage>. <pub-id pub-id-type="doi">10.1093/nargab/lqaa032</pub-id> </citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Menche</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Barab&#xe1;si</surname>
<given-names>A.-L.</given-names>
</name>
<name>
<surname>Sharma</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Human symptoms-disease network</article-title>. <source>Nat. Commun.</source> <volume>5</volume>, <fpage>4212</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms5212</pub-id> </citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Notterpek</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Promoting peripheral myelin repair</article-title>. <source>Exp. Neurol.</source> <volume>283</volume>, <fpage>573</fpage>&#x2013;<lpage>580</lpage>. <pub-id pub-id-type="doi">10.1016/j.expneurol.2016.04.007</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>
