<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="3.0" xml:lang="EN">
<front>
<journal-meta><journal-id journal-id-type="publisher-id">plos</journal-id><journal-id journal-id-type="nlm-ta">PLoS Comput Biol</journal-id><journal-id journal-id-type="pmc">ploscomp</journal-id><!--===== Grouping journal title elements =====--><journal-title-group><journal-title>PLoS Computational Biology</journal-title></journal-title-group><issn pub-type="ppub">1553-734X</issn><issn pub-type="epub">1553-7358</issn><publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, USA</publisher-loc></publisher></journal-meta>
<article-meta><article-id pub-id-type="publisher-id">08-PLCB-RA-0966R2</article-id><article-id pub-id-type="doi">10.1371/journal.pcbi.1000374</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="Discipline"><subject>Cardiovascular Disorders</subject><subject>Computational Biology/Literature Analysis</subject><subject>Computational Biology/Systems Biology</subject><subject>Gastroenterology and Hepatology</subject><subject>Genetics and Genomics/Bioinformatics</subject><subject>Genetics and Genomics/Disease Models</subject><subject>Genetics and Genomics/Gene Discovery</subject><subject>Genetics and Genomics/Genetics of Disease</subject><subject>Genetics and Genomics/Medical Genetics</subject><subject>Mathematics/Statistics</subject><subject>Neurological Disorders</subject><subject>Ophthalmology</subject></subj-group></article-categories><title-group><article-title>Mapping Gene Associations in Human Mitochondria using Clinical Disease Phenotypes</article-title><alt-title alt-title-type="running-head">Mitochondrial Disease Phenotypes</alt-title></title-group><contrib-group>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Scharfe</surname><given-names>Curt</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="corresp" rid="cor1"><sup>*</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Lu</surname><given-names>Henry Horng-Shing</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Neuenburg</surname><given-names>Jutta K.</given-names></name><xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Allen</surname><given-names>Edward A.</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Li</surname><given-names>Guan-Cheng</given-names></name><xref ref-type="aff" rid="aff4"><sup>4</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Klopstock</surname><given-names>Thomas</given-names></name><xref ref-type="aff" rid="aff5"><sup>5</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Cowan</surname><given-names>Tina M.</given-names></name><xref ref-type="aff" rid="aff6"><sup>6</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Enns</surname><given-names>Gregory M.</given-names></name><xref ref-type="aff" rid="aff7"><sup>7</sup></xref></contrib>
<contrib contrib-type="author" xlink:type="simple"><name name-style="western"><surname>Davis</surname><given-names>Ronald W.</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
</contrib-group><aff id="aff1"><label>1</label><addr-line>Stanford Genome Technology Center, Stanford University, Palo Alto, California, United States of America</addr-line>       </aff><aff id="aff2"><label>2</label><addr-line>Institute of Statistics, National Chiao Tung University, Hsinchu, Taiwan</addr-line>       </aff><aff id="aff3"><label>3</label><addr-line>BioMarin Pharmaceutical, Novato, California, United States of America</addr-line>       </aff><aff id="aff4"><label>4</label><addr-line>Department of Operations Research, University of California Berkeley, Berkeley, California, United States of America</addr-line>       </aff><aff id="aff5"><label>5</label><addr-line>Friedrich-Baur-Institute, Department of Neurology, Ludwig Maximilians University, Munich, Germany</addr-line>       </aff><aff id="aff6"><label>6</label><addr-line>Departments of Pathology and Pediatrics, Stanford University, Stanford, California, United States of America</addr-line>       </aff><aff id="aff7"><label>7</label><addr-line>Department of Pediatrics, Medical Genetics Division, Stanford University, Stanford, California, United States of America</addr-line>       </aff><contrib-group>
<contrib contrib-type="editor" xlink:type="simple"><name name-style="western"><surname>Rzhetsky</surname><given-names>Andrey</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/></contrib>
</contrib-group><aff id="edit1">University of Chicago, United States of America</aff><author-notes>
<corresp id="cor1">* E-mail: <email xlink:type="simple">curts@stanford.edu</email></corresp>
<fn fn-type="con"><p>Conceived and designed the experiments: CS. Analyzed the data: CS HHSL GCL. Contributed reagents/materials/analysis tools: CS HHSL JKN EAA TK TMC GME RWD. Wrote the paper: CS. Collected and annotated phenotype data: CS TMC GME. Established the phenome ontology: CS JKN TK TMC GME. Created the online knowledgebase: CS EAA.</p></fn>
<fn fn-type="conflict"><p>The authors have declared that no competing interests exist.</p></fn></author-notes><pub-date pub-type="collection"><month>4</month><year>2009</year></pub-date><pub-date pub-type="epub"><day>24</day><month>4</month><year>2009</year></pub-date><volume>5</volume><issue>4</issue><elocation-id>e1000374</elocation-id><history>
<date date-type="received"><day>27</day><month>10</month><year>2008</year></date>
<date date-type="accepted"><day>24</day><month>3</month><year>2009</year></date>
</history><!--===== Grouping copyright info into permissions =====--><permissions><copyright-year>2009</copyright-year><copyright-holder>Scharfe et al</copyright-holder><license><license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p></license></permissions><abstract>
<p>Nuclear genes encode most mitochondrial proteins, and their mutations cause diverse and debilitating clinical disorders. To date, 1,200 of these mitochondrial genes have been recorded, while no standardized catalog exists of the associated clinical phenotypes. Such a catalog would be useful to develop methods to analyze human phenotypic data, to determine genotype-phenotype relations among many genes and diseases, and to support the clinical diagnosis of mitochondrial disorders. Here we establish a clinical phenotype catalog of 174 mitochondrial disease genes and study associations of diseases and genes. Phenotypic features such as clinical signs and symptoms were manually annotated from full-text medical articles and classified based on the hierarchical MeSH ontology. This classification of phenotypic features of each gene allowed for the comparison of diseases between different genes. In turn, we were then able to measure the phenotypic associations of disease genes for which we calculated a quantitative value that is based on their shared phenotypic features. The results showed that genes sharing more similar phenotypes have a stronger tendency for functional interactions, proving the usefulness of phenotype similarity values in disease gene network analysis. We then constructed a functional network of mitochondrial genes and discovered a higher connectivity for non-disease than for disease genes, and a tendency of disease genes to interact with each other. Utilizing these differences, we propose 168 candidate genes that resemble the characteristic interaction patterns of mitochondrial disease genes. Through their network associations, the candidates are further prioritized for the study of specific disorders such as optic neuropathies and Parkinson disease. Most mitochondrial disease phenotypes involve several clinical categories including neurologic, metabolic, and gastrointestinal disorders, which might indicate the effects of gene defects within the mitochondrial system. The accompanying knowledgebase (<ext-link ext-link-type="uri" xlink:href="http://www.mitophenome.org/" xlink:type="simple">http://www.mitophenome.org/</ext-link>) supports the study of clinical diseases and associated genes.</p>
</abstract><abstract abstract-type="summary"><title>Author Summary</title>
<p>An important prerequisite for successful disease gene identification is the assessment, with minimal ambiguity, of a particular clinical trait or phenotype. Even with years of experience, recognizing and diagnosing mitochondrial diseases is still a major hurdle in clinical medicine. Computational tools supporting clinicians not only help identify affected individuals, but also guide studies of the genetic and biological causes of these disorders. In this study we dissect and categorize individual clinical features, signs, and symptoms of 174 disease genes and then identify gene similarities based on their shared phenotypic features. We demonstrate that genes sharing more similar phenotypes have a stronger tendency for functional interactions, proving the usefulness of phenotype similarity values in disease gene network analysis. Our study of a large functional network of mitochondrial genes revealed distinct properties that differentiate disease and non-disease genes. Disease genes showed a lower average total connectivity but a tendency to interact with each other; a finding that we used to predict 168 high-probability disease candidates. The accompanying knowledgebase allows for easy navigation between disease and gene information. We believe the open source format will support and encourage further research that will benefit this and other human phenome projects.</p>
</abstract><funding-group><funding-statement>This work was supported by a National Eye Institute grant (to R.W.D. and C.S.) and a NSC grant in Taiwan (to H.H.L.). T.K. is a member of MitoNET funded by the German ministry of education and research (BMBF). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement></funding-group><counts><page-count count="12"/></counts></article-meta>
</front>
<body><sec id="s1">
<title>Introduction</title>
<p>Mitochondrial diseases are caused by an abnormal function of mitochondria. They may be the result of spontaneous or inherited mutations in the mitochondrial genome (mtDNA) or in nuclear genes that code for mitochondrial components, but may also be acquired secondary to adverse effects of drugs, infections, or other environmental causes <xref ref-type="bibr" rid="pcbi.1000374-Luft1">[1]</xref>–<xref ref-type="bibr" rid="pcbi.1000374-Wallace1">[3]</xref>. The mtDNA encodes only 13 proteins of the respiratory chain <xref ref-type="bibr" rid="pcbi.1000374-Anderson1">[4]</xref>, while most of the estimated 1,500 mitochondrial proteins are nuclear-encoded <xref ref-type="bibr" rid="pcbi.1000374-Prokisch1">[5]</xref>. Mitochondrial deficiencies often affect multiple tissues leading to multi-system diseases that present with many phenotypic features. These dysfunctions appear to be more prevalent in hereditary diseases than previously anticipated <xref ref-type="bibr" rid="pcbi.1000374-Chinnery1">[6]</xref>–<xref ref-type="bibr" rid="pcbi.1000374-Skladal1">[8]</xref> and have also been attributed to the pathogenesis of common conditions associated with aging <xref ref-type="bibr" rid="pcbi.1000374-Wallace1">[3]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Enns1">[9]</xref> including neurodegenerative diseases <xref ref-type="bibr" rid="pcbi.1000374-Dawson1">[10]</xref>, cardiovascular disorders <xref ref-type="bibr" rid="pcbi.1000374-Rosca1">[11]</xref>, diabetes mellitus <xref ref-type="bibr" rid="pcbi.1000374-Lowell1">[12]</xref>, and several cancer types <xref ref-type="bibr" rid="pcbi.1000374-Delsite1">[13]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Eng1">[14]</xref>.</p>
<p>Medical case reports of specific gene defects have been crucial to our understanding of clinical phenotypes. The list of mitochondrial disease genes and case reports has grown rapidly, while methods for defining and assaying clinical phenotypes are still inadequate <xref ref-type="bibr" rid="pcbi.1000374-Freimer1">[15]</xref>–<xref ref-type="bibr" rid="pcbi.1000374-Biesecker1">[17]</xref>. Accordingly, the accurate and systematic comparison of clinical phenotypes associated with different disease genes remains a major challenge. One limitation is the non-standardized formats of such phenotypic data in the medical literature and databases, which is difficult to overcome using automated text mining <xref ref-type="bibr" rid="pcbi.1000374-Nadkarni1">[18]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-vanDriel1">[19]</xref>. An example are optic nerve diseases for which multiple terms are found such as cranial nerve II diseases, neural-optic lesion, optic disk disorder, and optic atrophy. Higher-level phenome knowledgebases recently emerged in an attempt to comprehensively index human phenotype data <xref ref-type="bibr" rid="pcbi.1000374-Singer1">[20]</xref>–<xref ref-type="bibr" rid="pcbi.1000374-Sabb1">[22]</xref>. The process of transforming descriptions of medical diagnoses and procedures into universal computer-readable medical code numbers involves manual reviews and annotations of full-text articles <xref ref-type="bibr" rid="pcbi.1000374-Biesecker1">[17]</xref>. As with other knowledgebases <xref ref-type="bibr" rid="pcbi.1000374-Calvano1">[23]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-HernandezBoussard1">[24]</xref>, catalogs of clinical phenotypes are set within the context of the existing literature, but are also limited by the inherent problems of working with an evolving literature.</p>
<p>In this study, we catalogued detailed information on clinical disease phenotypes of known mitochondrial gene defects that were stored in a phenome knowledgebase. We then developed methods to analyze the clinical phenotype information, to determine associations of genes and diseases, and to compare different disease genes based on their associated phenotypes. This approach was used to predict disease gene similarities, which showed positive correlations to their functional interactions. Our analysis of a functional interaction network of mitochondrial genes revealed distinct properties for disease and non-disease genes, which we utilized to predict new disease candidate genes. Our knowledgebase (<ext-link ext-link-type="uri" xlink:href="http://www.mitophenome.org" xlink:type="simple">www.mitophenome.org</ext-link>) represents a new resource for studying links between disorders and genes. This can be integrated with a variety of systems approaches <xref ref-type="bibr" rid="pcbi.1000374-Vo1">[25]</xref> with the goal of identifying disease gene variants in the individuals that carry them.</p>
</sec><sec id="s2">
<title>Results</title>
<sec id="s2a">
<title>Annotation of mitochondrial genes and diseases</title>
<p>We identified 174 nuclear-encoded mitochondrial genes (<xref ref-type="supplementary-material" rid="pcbi.1000374.s004"><bold>Table S1</bold></xref>) associated with 191 diseases in the Online Mendelian Inheritance in Man (OMIM) database <xref ref-type="bibr" rid="pcbi.1000374-Hamosh1">[26]</xref>. In order to characterize these disorders in detail, we manually searched the PubMed literature for their phenotypic features such as clinical signs and symptoms, biochemical and clinical laboratory tests, and neurological imaging findings. Our annotations consisted of three steps that included the collection, definition, and classification of phenotypic features for each disease gene. Importantly, we individually matched the phenotypic features with standardized descriptors in the Medical Subject Headings (MeSH) database <xref ref-type="bibr" rid="pcbi.1000374-httpwww.nlm.nih.govmeshmeshhome.html1">[27]</xref>. Within the hierarchical MeSH ontology, we localized the individual feature position and then identified, for each feature, the directly related parent descriptor or hypernym feature. Using this approach, we reviewed 1,636 full-text articles reporting defects or deficiencies in the 174 disease genes and individually extracted phenotypic features for each gene. We then matched features with MeSH descriptors and identified their hypernyms, which generated 502 features hierarchically classified within the mitochondrial phenotype ontology (<xref ref-type="supplementary-material" rid="pcbi.1000374.s005"><bold>Table S2</bold></xref>). At its root, the ontology has fourteen features corresponding to fourteen major clinical categories (CC) such as cardiovascular diseases or neurological diseases. These CC are used to discriminate the more specific features in each group: for example arrhythmia in the cardiovascular CC and seizures in the neurologic CC. A subset of the features in our phenotype ontology is listed in <xref ref-type="table" rid="pcbi-1000374-t001"><bold>Table 1</bold></xref>.</p>
<table-wrap id="pcbi-1000374-t001" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.1000374.t001</object-id><label>Table 1</label><caption>
<title>Phenotypic features of human mitochondrial diseases.</title>
</caption><!--===== Grouping alternate versions of objects =====--><alternatives><graphic id="pcbi-1000374-t001-1" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.t001" xlink:type="simple"/><table><colgroup span="1"><col align="left" span="1"/><col align="center" span="1"/><col align="center" span="1"/></colgroup>
<tbody>
<tr>
<td align="left" colspan="1" rowspan="1"><bold>1. Cardiovascular</bold> (110)</td>
<td align="left" colspan="1" rowspan="1"><bold>7. Immunologic</bold> (78)</td>
<td align="left" colspan="1" rowspan="1">Neuromuscular-manifestations (129)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Arrhythmia (38)</td>
<td align="left" colspan="1" rowspan="1">Autoimmune-diseases (2)</td>
<td align="left" colspan="1" rowspan="1">Paralysis-Paresis (39)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Cardiomyopathy (44)</td>
<td align="left" colspan="1" rowspan="1">Immune-deficiency (7)</td>
<td align="left" colspan="1" rowspan="1">Reflexes-abnormal (78)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Cardiorespiratory-arrest (81)</td>
<td align="left" colspan="1" rowspan="1">Infections (76)</td>
<td align="left" colspan="1" rowspan="1">Hearing-disorders (30)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Hypertension (20)</td>
<td align="left" colspan="1" rowspan="1"><bold>8. Metabolic</bold> (143)</td>
<td align="left" colspan="1" rowspan="1">Voice-disorders (11)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Hypotension (19)</td>
<td align="left" colspan="1" rowspan="1">Acidosis (87)</td>
<td align="left" colspan="1" rowspan="1">Stroke-like-episodes (10)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Myocardial-ischemia (6)</td>
<td align="left" colspan="1" rowspan="1">Reye-like-symptoms (15)</td>
<td align="left" colspan="1" rowspan="1">Developmental-delay (111)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1"><bold>2. Dermatologic</bold> (56)</td>
<td align="left" colspan="1" rowspan="1">Dyslipidemias (14)</td>
<td align="left" colspan="1" rowspan="1">Polyneuropathies (37)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Dermatitis (7)</td>
<td align="left" colspan="1" rowspan="1">Diabetes-mellitus (18)</td>
<td align="left" colspan="1" rowspan="1">Sleep-disorders (11)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Hair-diseases (15)</td>
<td align="left" colspan="1" rowspan="1">Hyperglycemia (12)</td>
<td align="left" colspan="1" rowspan="1"><bold>11. Oncologic</bold> (29)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Pigmentation-disorders (11)</td>
<td align="left" colspan="1" rowspan="1">Hyperinsulinism (5)</td>
<td align="left" colspan="1" rowspan="1">Squamous-cell-neoplasms (4)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Hyperhidrosis (15)</td>
<td align="left" colspan="1" rowspan="1">Hypoglycemia (52)</td>
<td align="left" colspan="1" rowspan="1">Neuroendocrine-tumors (6)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Paleness (22)</td>
<td align="left" colspan="1" rowspan="1">Hyperammonemia (40)</td>
<td align="left" colspan="1" rowspan="1">Paraganglioma (3)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1"><bold>3. Endocrinologic</bold> (40)</td>
<td align="left" colspan="1" rowspan="1">Hyperbilirubinemia (23)</td>
<td align="left" colspan="1" rowspan="1">Leukemia-Lymphoma (9)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Adrenal-gland-diseases (14)</td>
<td align="left" colspan="1" rowspan="1">Hemochromatosis (11)</td>
<td align="left" colspan="1" rowspan="1">Breast-neoplasms (5)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Adrenal-insufficiency (9)</td>
<td align="left" colspan="1" rowspan="1">Aminoacid-levels-abnormal (47)</td>
<td align="left" colspan="1" rowspan="1">Colorectal-neoplasms (4)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Adrenocortical-hyperfunction (7)</td>
<td align="left" colspan="1" rowspan="1">Water-electrolyte-imbalance (49)</td>
<td align="left" colspan="1" rowspan="1">Hepatocellular-carcinoma (7)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Gonadal-disorders (23)</td>
<td align="left" colspan="1" rowspan="1">Obesity (8)</td>
<td align="left" colspan="1" rowspan="1">Leiomyoma (4)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Sex-differentiation-disorders (12)</td>
<td align="left" colspan="1" rowspan="1">Fatty-acids-abnormal (21)</td>
<td align="left" colspan="1" rowspan="1">Prostatic-neoplasms (4)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Parathyroid-diseases (5)</td>
<td align="left" colspan="1" rowspan="1">Organic-acids-abnormal (69)</td>
<td align="left" colspan="1" rowspan="1">Renal-cell-carcinoma (4)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Pituitary-diseases (10)</td>
<td align="left" colspan="1" rowspan="1">Dicarboxylic-aciduria (20)</td>
<td align="left" colspan="1" rowspan="1"><bold>12. Ophthalmologic</bold> (87)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Thyroid-diseases (18)</td>
<td align="left" colspan="1" rowspan="1"><bold>9. Musculosceletal</bold> (95)</td>
<td align="left" colspan="1" rowspan="1">Blepharoptosis (20)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1"><bold>4. Gastrointestinal</bold> (132)</td>
<td align="left" colspan="1" rowspan="1">Osteoporosis (8)</td>
<td align="left" colspan="1" rowspan="1">Cataract (15)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Cholestasis (16)</td>
<td align="left" colspan="1" rowspan="1">Spinal-diseases (25)</td>
<td align="left" colspan="1" rowspan="1">Pathologic-nystagmus (38)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Deglutition-disorders (29)</td>
<td align="left" colspan="1" rowspan="1">Pathological-fractures (9)</td>
<td align="left" colspan="1" rowspan="1">Ophthalmoplegia (15)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Gastroenteritis (28)</td>
<td align="left" colspan="1" rowspan="1">Foot-deformities (20)</td>
<td align="left" colspan="1" rowspan="1">Optic-nerve-diseases (34)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Intestinal-obstruction (13)</td>
<td align="left" colspan="1" rowspan="1">Joint-diseases (18)</td>
<td align="left" colspan="1" rowspan="1">Retinal-diseases (27)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Gastrointestinal-hemorrhage (9)</td>
<td align="left" colspan="1" rowspan="1">Muscular-diseases (38)</td>
<td align="left" colspan="1" rowspan="1">Color-vision-defects (7)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Liver-diseases (79)</td>
<td align="left" colspan="1" rowspan="1">Rhabdomyolysis (8)</td>
<td align="left" colspan="1" rowspan="1"><bold>13. Psychiatric</bold> (51)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Fatty-liver (34)</td>
<td align="left" colspan="1" rowspan="1">Microcephaly (39)</td>
<td align="left" colspan="1" rowspan="1">Aggression (15)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Pancreatitis (9)</td>
<td align="left" colspan="1" rowspan="1"><bold>10. Neurologic</bold> (154)</td>
<td align="left" colspan="1" rowspan="1">Feeding-behavior (8)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Abdominal-pain (31)</td>
<td align="left" colspan="1" rowspan="1">Brain-diseases (135)</td>
<td align="left" colspan="1" rowspan="1">Anxiety-disorders (18)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Feeding-difficulties (67)</td>
<td align="left" colspan="1" rowspan="1">Intracranial-hemorrhages (17)</td>
<td align="left" colspan="1" rowspan="1">Dementia (18)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Diarrhea (37)</td>
<td align="left" colspan="1" rowspan="1">Seizures (97)</td>
<td align="left" colspan="1" rowspan="1">Autistic-disorder (8)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Vomiting (80)</td>
<td align="left" colspan="1" rowspan="1">Headache-disorders (21)</td>
<td align="left" colspan="1" rowspan="1">Depressive-disorder (19)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1"><bold>5. Genitourinary</bold> (68)</td>
<td align="left" colspan="1" rowspan="1">Leukoencephalopathy (39)</td>
<td align="left" colspan="1" rowspan="1">Psychotic-disorders (20)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Infertility-male (7)</td>
<td align="left" colspan="1" rowspan="1">Cerebellar-atrophy (28)</td>
<td align="left" colspan="1" rowspan="1">Schizophrenia (8)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Hypospadias (6)</td>
<td align="left" colspan="1" rowspan="1">Corpus-callosum-hypoplasia (18)</td>
<td align="left" colspan="1" rowspan="1"><bold>14. Respiratory</bold> (108)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Cystic-kidney-diseases (7)</td>
<td align="left" colspan="1" rowspan="1">Choreatic-disorders (18)</td>
<td align="left" colspan="1" rowspan="1">Hyperventilation (40)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Nephrocalcinosis (4)</td>
<td align="left" colspan="1" rowspan="1">Dystonic-disorders (38)</td>
<td align="left" colspan="1" rowspan="1">Respiratory-insufficiency (51)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Renal-insufficiency (30)</td>
<td align="left" colspan="1" rowspan="1">Parkinsonian-disorders (12)</td>
<td align="left" colspan="1" rowspan="1">Asthma (8)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Urination-disorders (12)</td>
<td align="left" colspan="1" rowspan="1">Tremor (36)</td>
<td align="left" colspan="1" rowspan="1">Pneumonia (40)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Menstruation-disturbances (9)</td>
<td align="left" colspan="1" rowspan="1">Spinal-cord-diseases (29)</td>
<td align="left" colspan="1" rowspan="1">Pulmonary-edema (14)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Pregnancy-complications (15)</td>
<td align="left" colspan="1" rowspan="1">Neurogenic-bladder (10)</td>
<td align="left" colspan="1" rowspan="1"><bold>Miscellaneous</bold> (151)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1"><bold>6. Hematologic</bold> (75)</td>
<td align="left" colspan="1" rowspan="1">Ataxia (54)</td>
<td align="left" colspan="1" rowspan="1">Fever (52)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Anemia (34)</td>
<td align="left" colspan="1" rowspan="1">Speech-disorders (41)</td>
<td align="left" colspan="1" rowspan="1">Hypothermia (17)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Blood-coagulation-disorders (24)</td>
<td align="left" colspan="1" rowspan="1">Consciousness-disorders (65)</td>
<td align="left" colspan="1" rowspan="1">Exercise-intolerance (36)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Petechiae (4)</td>
<td align="left" colspan="1" rowspan="1">Memory-disorders (13)</td>
<td align="left" colspan="1" rowspan="1">Failure-to-thrive (62)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Blood-platelet-disorders (21)</td>
<td align="left" colspan="1" rowspan="1">Mental-retardation (68)</td>
<td align="left" colspan="1" rowspan="1">Growth-deficiency (54)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Blood-protein-disorders (20)</td>
<td align="left" colspan="1" rowspan="1">Hallucinations (14)</td>
<td align="left" colspan="1" rowspan="1">Dysmorphisms-abnormalities (39)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Bone-marrow-diseases (20)</td>
<td align="left" colspan="1" rowspan="1">Psychomotor-agitation (34)</td>
<td align="left" colspan="1" rowspan="1">Odors (10)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Leukocyte-disorders (25)</td>
<td align="left" colspan="1" rowspan="1">Irritability (39)</td>
<td align="left" colspan="1" rowspan="1">RCC-deficiencies (42)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Lymphatic-diseases (8)</td>
<td align="left" colspan="1" rowspan="1">Lethargy (69)</td>
<td align="left" colspan="1" rowspan="1">Vitamin-responsive (24)</td>
</tr>
</tbody>
</table></alternatives><table-wrap-foot><fn id="nt101"><p>The 144 features are selected from a total of 502 features (<xref ref-type="supplementary-material" rid="pcbi.1000374.s005"><bold>Table S2</bold></xref>) and are caused by defects in 174 nuclear-encoded mitochondrial genes. Every feature is associated with the number of genes shown in parentheses. The hierarchical structure of features within the phenotype ontology was established using standardized MeSH descriptors (not shown). The fourteen CC in bold serve as headers for features within them. Unassigned features are grouped under ‘Miscellaneous’.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2b">
<title>Clinical categories (CC) of mitochondrial disorders</title>
<p>A categorical breakdown of the 502 features in their fourteen CC is shown in the inner circle of <xref ref-type="fig" rid="pcbi-1000374-g001"><bold>Figure 1A</bold></xref>. While most CC were comprised of more than twenty individual features, the neurologic and metabolic CC contained the largest fraction of features (18.5% and 14.3%, respectively). We then explored the overall characteristics of mitochondrial phenotypes across all gene defects. We had annotated a total of 9,407 gene-feature pairs (<xref ref-type="supplementary-material" rid="pcbi.1000374.s006"><bold>Table S3</bold></xref>) that included, for each of the 174 disease genes, features identified through our literature search and hypernyms to these features assigned through integration with the phenotype ontology (see <xref ref-type="sec" rid="s4">methods</xref>). A relative breakdown of the fourteen CC across the 9,407 gene-feature pairs is shown in the outer circle of <xref ref-type="fig" rid="pcbi-1000374-g001"><bold>Figure 1A</bold></xref>. This analysis revealed CC patterns similar to the categorical distribution above, with neurological (33.3%) and metabolic (13.0%) features most prominently represented. Together with the third largest CC of gastrointestinal (8.6%) diseases, these three CC account for more than half of all features in all gene-feature pairs studied. In comparison, the oncologic and endocrinologic CC contained relative large numbers of features, but these categories were associated with fewer genes and are less frequently observed in mitochondrial disorders.</p>
<fig id="pcbi-1000374-g001" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.1000374.g001</object-id><label>Figure 1</label><caption>
<title>Distribution of clinical phenotypic features in mitochondrial diseases.</title>
<p>(A) The inner circle shows the distribution of 502 phenotypic features among fourteen clinical categories (CC), plus a ‘Miscellaneous’ category containing unassigned features. The numbers show the fraction in % of all features in one CC compared to all 502 features. The outer circle shows the distribution of features related to CC within the 9,407 gene-feature pairs, with the frequency in % of all features in one CC. (B) Number of genes with features in a specific CC (y-axis) in correlation to the average number of CC-specific features caused by these genes (x-axis). 154 genes caused neurological features with an average of 20.2 neurological features per gene. Phenotypically, most mitochondrial gene defects are related to neurological, metabolic and gastrointestinal diseases.</p>
</caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.g001" xlink:type="simple"/></fig>
<p>The distribution of phenotypes within CC is largely consistent with the tissue distribution of energy expenditure in the resting state, or basal metabolic rate (BMR), with brain contributing to the highest proportion of the BMR (90% in newborns, 60% in infants, and 25% in adults) <xref ref-type="bibr" rid="pcbi.1000374-Holliday1">[28]</xref>, followed by liver (20–25% BMR) and resting muscle (10–25% BMR). Mitochondria provide most of the body's energy <xref ref-type="bibr" rid="pcbi.1000374-Wallace1">[3]</xref>, and measurements of mitochondrial respiration have shown that brain tissue contains more active respiratory chain complexes than liver, heart, or muscle <xref ref-type="bibr" rid="pcbi.1000374-Benard1">[29]</xref>. Thus, our results showing a higher proportion of neurological, metabolic, and gastrointestinal (e.g. liver diseases) features positively correlate to BMR and respiratory-chain activities. A related analysis of genes associated with the fourteen CC confirms this observation (<xref ref-type="fig" rid="pcbi-1000374-g001"><bold>Figure 1B</bold></xref>). While most genes were associated with the neurologic, metabolic or gastrointestinal CC, these genes also caused more features within these CC. For example, 154 genes were associated with the neurological CC with each gene causing on average 20.3 neurological features. Although mitochondrial defects affect many cellular processes <xref ref-type="bibr" rid="pcbi.1000374-Prokisch1">[5]</xref>, the phenotype patterns predominantly represent deficiencies in energy metabolism with the nervous system being most susceptible. Like the gene-expression patterns in the study of human phenotypic diversity <xref ref-type="bibr" rid="pcbi.1000374-Storey1">[30]</xref>, CC patterns may aid to characterize and distinguish phenotype groups such as mitochondrial disorders.</p>
</sec><sec id="s2c">
<title>Clinical phenotype similarities between mitochondrial disease genes</title>
<p>Inherited diseases often present with multiple phenotypic features. The presence or absence of specific features is traditionally used to distinguish between different disorders and identify clinical traits <xref ref-type="bibr" rid="pcbi.1000374-Hamosh1">[26]</xref>. It is hypothesized that phenotype similarities of different disorders may indicate biological relationships of the underlying genes <xref ref-type="bibr" rid="pcbi.1000374-Freimer1">[15]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Brunner1">[16]</xref>. Several systematic studies have recently investigated genotype-phenotype associations in human genetic disorders <xref ref-type="bibr" rid="pcbi.1000374-vanDriel1">[19]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Butte1">[31]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Lage1">[32]</xref>. These approaches utilized automated text mining to extract phenotype information, while noting that currently available text formats and databases were not designed as structured resources for human phenotype analysis <xref ref-type="bibr" rid="pcbi.1000374-vanDriel1">[19]</xref>. Another study utilized disorder terms from OMIM's Morbid map and manually annotated each disorder into one of 22 disorder classes <xref ref-type="bibr" rid="pcbi.1000374-Goh1">[33]</xref>, which are comparable to our CC. Notably, the Morbid map terms represent only a small fraction of the phenotype information of a clinical disorder and genes with identical terms may cause phenotypic features from different CC. In order to explore associations of genes and features in mitochondrial diseases, we utilized our manually annotated 9,407 gene-feature pairs (<xref ref-type="supplementary-material" rid="pcbi.1000374.s006"><bold>Table S3</bold></xref>). Evidence for each gene-feature association is derived from one or more of 1,636 full-text articles, where each article is linked to a PubMed unique identifier (PMID). Using the PMID we computed the association ratio for each gene-feature pair. This ratio represents the number of PMID reporting a specific feature for a specific gene out of all PMID annotated for this gene. In addition, we determined the association ratios of pairs of genes linked to the same feature (see <xref ref-type="sec" rid="s4">Methods</xref>). The integration of association ratios for all features related to a gene pair enabled the prediction of quantitative phenotypic associations (QPA). Thus, QPA are a quantitative measure of phenotype similarity of disease genes causing one or more identical phenotypic feature.</p>
</sec><sec id="s2d">
<title>Correlation of phenotypic associations and gene functional interactions</title>
<p>We then compared disease genes with QPA and functional interactions, in order to explore the hypothesis of phenotypic similarities in functionally related genes <xref ref-type="bibr" rid="pcbi.1000374-Freimer1">[15]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Brunner1">[16]</xref>. We identified 1,928 gene pairs (n = 139 genes) from a recent study with Likelihood Ratios (LR) for gene functional interactions <xref ref-type="bibr" rid="pcbi.1000374-Franke1">[34]</xref>, and for which we had predicted QPA (<xref ref-type="supplementary-material" rid="pcbi.1000374.s007"><bold>Table S4</bold></xref>). Using rank correlation, we detected positive associations with significant confidence of QPA and LR for these disease gene pairs (Kendall: p = 4.67e-7; Spearman: p = 3.72e-7). The results indicated that genes with stronger evidence for functional interaction (higher LR) displayed greater similarities in their associated disease phenotypes (higher QPA). To select gene pairs with the highest correlation of LR and QPA, we applied hierarchical clustering and identified groups of gene pairs with higher to lower levels of association (see <xref ref-type="sec" rid="s4">Methods</xref>). In addition, we compared the 1,928 gene pairs with both LR and QPA to pairs predicted by only one method. Hypothesis testing revealed that these pairs showed on average higher values for LR (p = 6.86e-10) and QPA (p = 0.029) than pairs predicted by only one method (LR pairs only n = 82; QPA pairs only n = 26,010). Thus, LR and QPA in combination could be helpful in the analysis of disease gene associations.</p>
<p>In our next analysis we identified 39 disease genes encoding components of seven mitochondrial protein complexes and two metabolic pathways, representing nine functional modules (<xref ref-type="supplementary-material" rid="pcbi.1000374.s007"><bold>Table S4</bold></xref>). For each gene within a given module, we calculated the QPA average relative to all other genes in the module (<xref ref-type="fig" rid="pcbi-1000374-g002"><bold>Figure 2A</bold></xref>). While genes within some modules were associated with similar disease phenotypes (e.g. RCC1, RCC4), other modules appeared phenotypically more diverse (e.g. BCKDH, TCA). We then compared QPA of gene pairs within modules (n = 262 pairs) to pairs outside modules (n = 27,676 pairs). This analysis revealed a higher average phenotype similarity for gene pairs within versus outside the nine modules (p = 2.64e-5). We found a comparable result in the analysis of gene functional interactions, with on average higher LR for gene pairs within (n = 182) versus pairs outside these modules (n = 1,828; p = 1.86e-35). In summary, we identified positive correlations of functional (LR) and phenotypic (QPA) associations for many disease genes, with the most prominent genotype-phenotype relationships in protein complexes (<xref ref-type="fig" rid="pcbi-1000374-g002"><bold>Figure 2B</bold></xref><bold>)</bold>. These results support findings of a recent study that utilized automated text mining in OMIM to identify phenotypic similarities within protein complexes <xref ref-type="bibr" rid="pcbi.1000374-Lage1">[32]</xref>. However, it should be noted that OMIM often combines genes into a single disease record, if they encode subunits of the same protein complex (e.g. BCKDH - Maple syrup urine disease, #248600; GCC - Glycine encephalopathy, #605899). Potential circular reasoning in correlating phenotypes and complexes could be reduced by individual disease gene annotations. While statistically very significant, the genotype-phenotype correlation values observed in this and other studies are still rather small <xref ref-type="bibr" rid="pcbi.1000374-Braun1">[35]</xref>. Possible contributing factors are the imperfect information about gene-gene and gene-disease associations and the environment.</p>
<fig id="pcbi-1000374-g002" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.1000374.g002</object-id><label>Figure 2</label><caption>
<title>Phenotype similarity of genes related to mitochondrial protein complexes and pathways.</title>
<p>(A) For each gene (black dots), the average QPA (y-axis) to all other genes within a functional module was calculated. Red lines represent the median (50th percentile) of all QPA averages within a module. Boxes indicate the 25th and 75th quartiles, with minimum and maximum data points as lines that extend from each end of the box. The grand mean of all modules (blue line) is the QPA average across all gene pairs of all nine modules, which was significantly higher than for pairs outside modules (orange line). (B) Module gene relationships are predicted through functional (LR) and phenotypic (QPA) associations showing the usefulness of phenotype similarity scores in disease gene network analysis. The edge colors are: Red – gene pairs with highest correlation of QPA and LR; blue – gene pairs with lower QPA-LR correlation; orange and light blue – gene pairs with QPA only at higher (&gt; = 0.4) and lower confidence (&lt;0.4), respectively (see <xref ref-type="supplementary-material" rid="pcbi.1000374.s007">Table S4</xref> for data). Diseases caused by the six genes labeled “*” are known to respond to vitamin treatments (riboflavin, thiamine, and pyridoxine). Abbreviations: AKDH, Alpha ketoglutarate dehydrogenase; BCKDH, Branched chain alpha keto acid dehydrogenase; GCC, Glycine cleavage system; PDH, Pyruvate dehydrogenase; RCC, Respiratory chain complex; TCA, Tricarboxylic acid cycle; UC, Urea cycle.</p>
</caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.g002" xlink:type="simple"/></fig></sec><sec id="s2e">
<title>Functional interactions of nuclear-encoded mitochondrial genes</title>
<p>We then expanded our analysis and identified functional interactions for 162 disease genes (DG) to 4,577 candidate genes (CG) from a recent study <xref ref-type="bibr" rid="pcbi.1000374-Franke1">[34]</xref>. As for the DG, we also extracted all binary functional interactions for each CG in order to account for all genome-wide interactions of all 4,739 genes studied (<xref ref-type="supplementary-material" rid="pcbi.1000374.s008"><bold>Table S5</bold></xref>). Of the CG, 531 genes had disease associations in OMIM <xref ref-type="bibr" rid="pcbi.1000374-Hamosh1">[26]</xref> and we consequently labeled those as DG. We recorded in total more than 1.9 million gene interactions that included interactions between disease genes (DG-DG), disease and candidate genes (DG-CG, CG-DG), and candidate genes (CG-CG). We first focused on the mitochondrial gene network and identified a set of 495 mitochondrial CG through data integration of two recent studies <xref ref-type="bibr" rid="pcbi.1000374-Prokisch1">[5]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Calvo1">[36]</xref>. These studies combined had predicted 1,200 human mitochondrial genes (<xref ref-type="supplementary-material" rid="pcbi.1000374.s009"><bold>Table S6</bold></xref>). Our analysis of functional interactions of all mitochondrial CG (495) and DG (162) showed the following results: i. the total number of interactions (i[all-genes]), which is recorded to all human genes, was higher for CG than for DG (p = 7.93e-6); ii. the relative number of DG interactions (i[disease-genes]/i[all-genes]), which was recorded to all known human DG, was higher for DG than for CG (p = 6.37e-7); and iii. the relative number of interactions to human orthologs of mouse (i[mouse-essential]/i[all-genes]) and yeast (i[yeast-essential]/i[all-genes]) essential genes <xref ref-type="bibr" rid="pcbi.1000374-Goh1">[33]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Giaever1">[37]</xref> was higher for the DG than the CG (mouse p = 1.72e-4; yeast p = 0.013). These results indicated that mitochondrial CG and DG can be distinguished based on functional interaction patterns.</p>
<p>In a related analysis, we compared the functional interactions of DG (493) and CG (3551) located outside the mitochondrial organelle (<xref ref-type="table" rid="pcbi-1000374-t002"><bold>Table 2</bold></xref>), which showed similar results (i., ii. and iii.) as for the mitochondrial gene groups (see <xref ref-type="sec" rid="s4">Methods</xref> for data). However, the comparison of mitochondrial and non-mitochondrial genes revealed some surprises. The total number of interactions for non-mitochondrial DG was higher than for mitochondrial DG (p = 6.5e-29), and the number of interactions for non-mitochondrial CG was higher than for mitochondrial CG (p = 2.37e-93). Notably, the non-mitochondrial DG had on average more interactions than the mitochondrial CG (p = 1.87e-19). To further investigate these differences, we literature-annotated detailed information on intracellular localizations of gene products (<xref ref-type="supplementary-material" rid="pcbi.1000374.s004"><bold>Table S1</bold></xref>). Out of the 162 DG, 115 genes had only evidence for mitochondrial localizations, while 47 DG also localized to additional compartments (e.g. nucleus, cytoplasm). In addition, we identified 38 DG out of the 4,577 CG (<xref ref-type="supplementary-material" rid="pcbi.1000374.s009"><bold>Table S6</bold></xref>) with likely mitochondrial localizations <xref ref-type="bibr" rid="pcbi.1000374-Prokisch1">[5]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Calvo1">[36]</xref>. These 38 DG (p = 0.06) and the 47 DG with multiple localizations (p = 0.51) tended to have more interactions than the 115 mitochondria-only DG although both results were not statistically significant. In summary, our analysis identified a higher average connectivity for non-disease genes (CG) than for DG, which was detected for both mitochondrial and non-mitochondrial genes, and secondly, fewer functional interactions of mitochondrial than for non-mitochondrial genes. These findings are supported by a separate gene fraction analysis (<xref ref-type="fig" rid="pcbi-1000374-g003"><bold>Figure 3</bold></xref>), where we studied the number of interactions of genes in the different gene groups and the distribution of these interactions over the whole network (see <xref ref-type="sec" rid="s4">Methods</xref>).</p>
<fig id="pcbi-1000374-g003" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.1000374.g003</object-id><label>Figure 3</label><caption>
<title>Functional interactions of human mitochondrial genes.</title>
<p>For each gene group, we calculated the fraction of genes (y-axis) that interact with k other genes (x-axis). The gene group fractions were calculated for interactions to all human genes (A), all disease genes (B), and all mitochondrial genes (C). The color codes of the gene groups with their respective regression line slopes and p-values (in parenthesis) are shown in the table (D), with all results including correlation coefficients listed in <xref ref-type="supplementary-material" rid="pcbi.1000374.s010">Table S7</xref>. The fraction analysis of all gene interactions (A) showed a higher network connectivity for non-disease genes (CG) than for disease genes (DG), as indicated by the larger absolute value of the negative DG regression slope. In contrast, the connectivity to disease genes is relatively higher for DG than for CG suggesting a tendency for DG to interact with each other (B). Human orthologs to mouse essential genes had the highest network connectivity, while the mitochondrial gene groups had the highest tendency to interact to other mitochondrial genes (C).</p>
</caption><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.g003" xlink:type="simple"/></fig><table-wrap id="pcbi-1000374-t002" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.1000374.t002</object-id><label>Table 2</label><caption>
<title>Molecular interactions of mitochondria and non-mitochondria genes.</title>
</caption><!--===== Grouping alternate versions of objects =====--><alternatives><graphic id="pcbi-1000374-t002-2" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.t002" xlink:type="simple"/><table><colgroup span="1"><col align="left" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/></colgroup>
<thead>
<tr>
<td align="left" colspan="1" rowspan="1">Gene group (genes/group)</td>
<td align="left" colspan="1" rowspan="1">i[all-genes]</td>
<td align="left" colspan="1" rowspan="1">i[disease-genes]</td>
<td align="left" colspan="1" rowspan="1">i[mouse-essential]</td>
<td align="left" colspan="1" rowspan="1">i[yeast-essential]</td>
<td align="left" colspan="1" rowspan="1">i[mito-genes]</td>
</tr>
</thead>
<tbody>
<tr>
<td align="left" colspan="1" rowspan="1">DG mitochondria (162)</td>
<td align="left" colspan="1" rowspan="1">120.91 (62)</td>
<td align="left" colspan="1" rowspan="1">26.14 (17.5)</td>
<td align="left" colspan="1" rowspan="1">13.23 (6)</td>
<td align="left" colspan="1" rowspan="1">20.56 (8.5)</td>
<td align="left" colspan="1" rowspan="1">42.24 (22)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">CG mitochondria (495)</td>
<td align="left" colspan="1" rowspan="1">190.19 (114)</td>
<td align="left" colspan="1" rowspan="1">23.93 (14)</td>
<td align="left" colspan="1" rowspan="1">14.75 (6)</td>
<td align="left" colspan="1" rowspan="1">36.51 (23)</td>
<td align="left" colspan="1" rowspan="1">49.81(37)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">DG non-mitochondria (493)</td>
<td align="left" colspan="1" rowspan="1">396.71 (154)</td>
<td align="left" colspan="1" rowspan="1">48.29 (22)</td>
<td align="left" colspan="1" rowspan="1">75.01 (17)</td>
<td align="left" colspan="1" rowspan="1">29.86 (19)</td>
<td align="left" colspan="1" rowspan="1">16.91 (8)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">CG non-mitochondria (3551)</td>
<td align="left" colspan="1" rowspan="1">459.74 (275)</td>
<td align="left" colspan="1" rowspan="1">48.81 (21)</td>
<td align="left" colspan="1" rowspan="1">78.4 (21)</td>
<td align="left" colspan="1" rowspan="1">44.48 (34)</td>
<td align="left" colspan="1" rowspan="1">21.38 (10)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">DG mito-only local. (115)</td>
<td align="left" colspan="1" rowspan="1">114.48 (67)</td>
<td align="left" colspan="1" rowspan="1">27.23 (19)</td>
<td align="left" colspan="1" rowspan="1">10.68 (6)</td>
<td align="left" colspan="1" rowspan="1">20.14 (9)</td>
<td align="left" colspan="1" rowspan="1">48.07 (25)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">DG mito+other local. (47)</td>
<td align="left" colspan="1" rowspan="1">136.66 (56)</td>
<td align="left" colspan="1" rowspan="1">23.47 (14)</td>
<td align="left" colspan="1" rowspan="1">19.47 (7)</td>
<td align="left" colspan="1" rowspan="1">21.57 (6)</td>
<td align="left" colspan="1" rowspan="1">27.98 (18)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">DG mito-predict local. (38)</td>
<td align="left" colspan="1" rowspan="1">192 (107)</td>
<td align="left" colspan="1" rowspan="1">31.18 (18)</td>
<td align="left" colspan="1" rowspan="1">22.03 (9)</td>
<td align="left" colspan="1" rowspan="1">36.13 (15)</td>
<td align="left" colspan="1" rowspan="1">45.76 (30)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Mouse essential genes (597)</td>
<td align="left" colspan="1" rowspan="1">598.22 (480)</td>
<td align="left" colspan="1" rowspan="1">69.64 (52)</td>
<td align="left" colspan="1" rowspan="1">116.7 (63)</td>
<td align="left" colspan="1" rowspan="1">39.94 (30)</td>
<td align="left" colspan="1" rowspan="1">17.31 (8)</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Yeast essential genes (609)</td>
<td align="left" colspan="1" rowspan="1">354.96 (230)</td>
<td align="left" colspan="1" rowspan="1">33.51 (18)</td>
<td align="left" colspan="1" rowspan="1">40.51 (16)</td>
<td align="left" colspan="1" rowspan="1">66.15 (54)</td>
<td align="left" colspan="1" rowspan="1">37.03 (25)</td>
</tr>
</tbody>
</table></alternatives><table-wrap-foot><fn id="nt102"><p>The total 4,739 genes studied are separated into nine gene groups with the number of disease genes (DG) and candidate genes (CG) in each group in parenthesis (see <xref ref-type="supplementary-material" rid="pcbi.1000374.s008"><bold>Table S5</bold></xref> for individual gene data). DG products with intracellular localization to only mitochondria (115 genes) and mitochondria-and-other-localizations (47 genes) are subsets of the 162 mitochondrial DG. The human orthologs to mouse and yeast essential genes are subsets of all 4,739 genes. The five data columns show the average number of interactions (i) of each group to all genes in the human genome (all-genes); all known human disease genes (disease-genes); all human orthologs of essential mouse genes (mouse-essential); all human orthologs of essential yeast genes; and to all nuclear-encoded human mitochondrial genes (mito-genes). The numbers in parenthesis show the median number of interactions for each group and attribute, respectively. The findings indicated distinct properties in gene molecular interactions for DG and CG, as well as for mitochondria and non-mitochondria genes.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2f">
<title>Candidate genes for mitochondrial disorders</title>
<p>In the last decade, several systematic studies have predicted functional candidate genes in genomic linkage intervals of mitochondrial diseases <xref ref-type="bibr" rid="pcbi.1000374-Tiranti1">[38]</xref>–<xref ref-type="bibr" rid="pcbi.1000374-Spinazzola1">[42]</xref>. In principle, all genes from a given interval are “benchmarked” against a database of annotated proteins <xref ref-type="bibr" rid="pcbi.1000374-Prokisch1">[5]</xref>, and genes identical to or functionally similar to the reference proteins are prioritized for mutational screens in affected individuals. Here, we build on the success of these approaches and predict new DG from a larger list of mitochondrial CG. Considering the identified interaction differences of disease and non-disease genes, we performed a supervised discriminant analysis <xref ref-type="bibr" rid="pcbi.1000374-1">[43]</xref> of all 695 mitochondrial genes using the five attributes of gene functional interactions (<xref ref-type="supplementary-material" rid="pcbi.1000374.s008"><bold>Table S5</bold></xref>). Out of the 495 mitochondrial CG, 254 genes were predicted as DG with a true positive rate of 80.2% based on the confirmed known DG. In addition, 26 of the 38 DG with likely mitochondrial localization, which we input-labeled as CG to serve as controls, were correctly classified as DG. As an alternative tool, we ran a supervised Bayesian network approach <xref ref-type="bibr" rid="pcbi.1000374-httpwww.cs.waikato.ac.nzremcowekabn1">[44]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Witten1">[45]</xref>. We first defined a training set of 100 typical out of the 162 mitochondrial DG based on their median of total gene interactions. Accordingly, 100 typical CG were selected from the 495 mitochondrial CG. The network analysis correctly identified 56.8% of the DG, 16 out of the 38 likely mitochondrial DG, and predicted 201 DG out of the 495 CG. Overlapping the two approaches predicted 168 novel mitochondrial DG with an estimated true positive rate of 85.8% (139 out of 162 DG) based on the correctly classified DG (<xref ref-type="supplementary-material" rid="pcbi.1000374.s011"><bold>Table S8</bold></xref>). The newly predicted disease candidates can be prioritized from the larger set of functional CG in linkage intervals of mitochondrial disorders (<xref ref-type="table" rid="pcbi-1000374-t003"><bold>Table 3</bold></xref>).</p>
<table-wrap id="pcbi-1000374-t003" position="float"><object-id pub-id-type="doi">10.1371/journal.pcbi.1000374.t003</object-id><label>Table 3</label><caption>
<title>Prioritizing candidate genes for mitochondrial disorders.</title>
</caption><!--===== Grouping alternate versions of objects =====--><alternatives><graphic id="pcbi-1000374-t003-3" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.t003" xlink:type="simple"/><table><colgroup span="1"><col align="left" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/><col align="center" span="1"/></colgroup>
<thead>
<tr>
<td align="left" colspan="1" rowspan="1">Mitochondrial Disorder</td>
<td align="left" colspan="1" rowspan="1">OMIM</td>
<td align="left" colspan="1" rowspan="1">Phenotypic features</td>
<td align="left" colspan="1" rowspan="1">Linkage interval</td>
<td align="left" colspan="1" rowspan="1">Size (Mb)</td>
<td align="left" colspan="1" rowspan="1">Gene loci</td>
<td align="left" colspan="1" rowspan="1">Mitochondrial genes marked (*) if known, and (<sup>#</sup>) if predicted disease gene</td>
</tr>
</thead>
<tbody>
<tr>
<td align="left" colspan="1" rowspan="1">Optic atrophy 2, OPA2</td>
<td align="left" colspan="1" rowspan="1">311050</td>
<td align="left" colspan="1" rowspan="1">optic nerve disease</td>
<td align="left" colspan="1" rowspan="1">DXS993-DXS991</td>
<td align="left" colspan="1" rowspan="1">14.5</td>
<td align="left" colspan="1" rowspan="1">352</td>
<td align="left" colspan="1" rowspan="1">MAOA*, ALAS2*, <bold>HSD17B10*</bold>; MAOB<sup>#</sup>, <bold>NDUFB11<sup>#</sup></bold>, <bold>TIMM17B<sup>#</sup></bold>; ARAF</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Optic atrophy 4, OPA4</td>
<td align="left" colspan="1" rowspan="1">605293</td>
<td align="left" colspan="1" rowspan="1">optic nerve disease</td>
<td align="left" colspan="1" rowspan="1">D18S34-D18S479</td>
<td align="left" colspan="1" rowspan="1">8.8</td>
<td align="left" colspan="1" rowspan="1">58</td>
<td align="left" colspan="1" rowspan="1">ATP5A1<sup>#</sup>, <bold>ACAA2<sup>#</sup></bold></td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Optic atrophy 5, OPA5</td>
<td align="left" colspan="1" rowspan="1">610708</td>
<td align="left" colspan="1" rowspan="1">optic nerve disease</td>
<td align="left" colspan="1" rowspan="1">D22S1148-D22S283</td>
<td align="left" colspan="1" rowspan="1">10.4</td>
<td align="left" colspan="1" rowspan="1">189</td>
<td align="left" colspan="1" rowspan="1">HSCB<sup>#</sup>, PISD<sup>#</sup>, <bold>TXN2<sup>#</sup></bold>, <bold>UCRC<sup>#</sup></bold>, <bold>TST<sup>#</sup></bold>; NIPSNAP1, MTP18</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Optic atrophy 6, OPA6</td>
<td align="left" colspan="1" rowspan="1">258500</td>
<td align="left" colspan="1" rowspan="1">optic nerve disease</td>
<td align="left" colspan="1" rowspan="1">D8S1702-D8S1794</td>
<td align="left" colspan="1" rowspan="1">12.3</td>
<td align="left" colspan="1" rowspan="1">86</td>
<td align="left" colspan="1" rowspan="1">UQCRB*, DECR1* PPM2C*; SLC7A13<sup>#</sup>; SLC7A13, FAM82B, MTERFD1</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Thyroid carcinoma, nonmedullary, TCO</td>
<td align="left" colspan="1" rowspan="1">601992</td>
<td align="left" colspan="1" rowspan="1">thyroid neoplasms</td>
<td align="left" colspan="1" rowspan="1">D19S884-D19S221</td>
<td align="left" colspan="1" rowspan="1">4.5</td>
<td align="left" colspan="1" rowspan="1">153</td>
<td align="left" colspan="1" rowspan="1">TIMM44<sup>#</sup>, <bold>NDUFA7<sup>#</sup></bold>; MRPL4, FDX1L, ECSIT</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Paragangliomas 2, PGL2</td>
<td align="left" colspan="1" rowspan="1">601650</td>
<td align="left" colspan="1" rowspan="1">neuroendocrine tumors</td>
<td align="left" colspan="1" rowspan="1">D11S956-PYGM</td>
<td align="left" colspan="1" rowspan="1">6.0</td>
<td align="left" colspan="1" rowspan="1">193</td>
<td align="left" colspan="1" rowspan="1">BAD<sup>#</sup>, PRDX5<sup>#</sup>, GLYAT<sup>#</sup>, <bold>C11orf79<sup>#</sup></bold>, <bold>COX8A<sup>#</sup></bold>; MRPL16, GLYATL1, GLYATL2</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Multiple mitochon-drial dysfunction syndrome, MMDFS</td>
<td align="left" colspan="1" rowspan="1">605711</td>
<td align="left" colspan="1" rowspan="1">muscle weakness, seizures, lethargy, feeding difficulties,</td>
<td align="left" colspan="1" rowspan="1">D2S1337-D2S441</td>
<td align="left" colspan="1" rowspan="1">8.8</td>
<td align="left" colspan="1" rowspan="1">79</td>
<td align="left" colspan="1" rowspan="1"><bold>MDH1<sup>#</sup></bold>; CCT4, ENSG00000119838</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Cowchock syndrome; NADMR</td>
<td align="left" colspan="1" rowspan="1">310490</td>
<td align="left" colspan="1" rowspan="1">muscle weakness, mental retardation, hearing disorder, polyneuropathy</td>
<td align="left" colspan="1" rowspan="1">DXS425-HPRT</td>
<td align="left" colspan="1" rowspan="1">13.7</td>
<td align="left" colspan="1" rowspan="1">152</td>
<td align="left" colspan="1" rowspan="1"><bold>NDUFA1*</bold>; <bold>AIFM1<sup>#</sup>, GLUD2<sup>#</sup>, SLC25A14<sup>#</sup></bold></td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">MEHMO syndrome</td>
<td align="left" colspan="1" rowspan="1">300148</td>
<td align="left" colspan="1" rowspan="1">mental retardation, seizures, obesity, hypogonadism</td>
<td align="left" colspan="1" rowspan="1">DXS365-CYBB</td>
<td align="left" colspan="1" rowspan="1">15.9</td>
<td align="left" colspan="1" rowspan="1">139</td>
<td align="left" colspan="1" rowspan="1"><bold>GK*</bold>; ACOT9<sup>#</sup>, PDK3<sup>#</sup>; APOO</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Gustavson syndrome, GUST</td>
<td align="left" colspan="1" rowspan="1">309555</td>
<td align="left" colspan="1" rowspan="1">mental retardation, optic nerve disease, seizures, deafness</td>
<td align="left" colspan="1" rowspan="1">DXS458-DXS424</td>
<td align="left" colspan="1" rowspan="1">20.2</td>
<td align="left" colspan="1" rowspan="1">285</td>
<td align="left" colspan="1" rowspan="1">ACSL4*, <bold>TIMM8A*</bold>; MCART6, SLC25A5, SLC25A43</td>
</tr>
<tr>
<td align="left" colspan="1" rowspan="1">Spastic paraplegia, SPG9</td>
<td align="left" colspan="1" rowspan="1">601162</td>
<td align="left" colspan="1" rowspan="1">paralysis-paresis, cataract, vomiting, foot deformities</td>
<td align="left" colspan="1" rowspan="1">D10S564-D10S603</td>
<td align="left" colspan="1" rowspan="1">9.4</td>
<td align="left" colspan="1" rowspan="1">166</td>
<td align="left" colspan="1" rowspan="1">COX15*, <bold>ALDH18A1*</bold>; NDUFB8<sup>#</sup>, GOT1<sup>#</sup>; C10orf65, SLC25A28</td>
</tr>
</tbody>
</table></alternatives><table-wrap-foot><fn id="nt103"><p>For each mitochondrial disorder (col.1), we identified the mitochondrial candidate genes (col.7) among all gene loci (col.6) in the genomic linkage interval (col.4). The mitochondrial genes are further sorted into: (*) known disease genes with genes (in bold) causing phenotypic features (col.3) similar to features linked to the disease interval; and (<sup>#</sup>) predicted disease genes with genes (in bold) that interact to known disease genes causing features similar to the disease interval features. For completeness, the unlabeled mitochondrial genes are not known or predicted disease genes.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s3">
<title>Discussion</title>
<p>The creation of human phenomic databases has been suggested to systematically collect and analyze phenotypic information <xref ref-type="bibr" rid="pcbi.1000374-Freimer1">[15]</xref>, <xref ref-type="bibr" rid="pcbi.1000374-Singer1">[20]</xref>–<xref ref-type="bibr" rid="pcbi.1000374-Sabb1">[22]</xref>. In this study, we established a clinical phenotype catalog of 174 mitochondrial disease genes (<xref ref-type="table" rid="pcbi-1000374-t001"><bold>Table 1</bold></xref>) that account for ∼10% of all known disease genes <xref ref-type="bibr" rid="pcbi.1000374-Hamosh1">[26]</xref>. In order to define and classify clinical phenotypes from 1,636 medical case reports, we developed a terminologic system that is based on the hierarchical MeSH ontology. Because automated text mining is limited in annotating clinical disorders from the literature <xref ref-type="bibr" rid="pcbi.1000374-Nadkarni1">[18]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-vanDriel1">[19]</xref>, our mapping of “phenotypes to language” required the manual review of each full-text article <xref ref-type="bibr" rid="pcbi.1000374-Biesecker1">[17]</xref>. This classification of phenotypic features for each gene allowed the comparison of disorders between different disease genes (<xref ref-type="fig" rid="pcbi-1000374-g001"><bold>Figure 1</bold></xref>). To measure clinical phenotype similarity between disease genes, we calculated a numerical value (QPA, quantitative phenotypic associations) that takes into account all annotated gene-feature associations, the overlap of features between two disease genes, and the frequency of the shared feature across all genes. Thus, QPA are based on the hypothesis that the value of a feature varies inversely with the number of genes with which it is associated <xref ref-type="bibr" rid="pcbi.1000374-Brunner1">[16]</xref>.</p>
<p>The analysis of disease gene pairs with QPA in comparison to Likelihood Ratios (LR) for functional interactions <xref ref-type="bibr" rid="pcbi.1000374-Franke1">[34]</xref> showed positive correlations. Disease genes with stronger evidence for functional interactions (higher LR) displayed greater similarities in their clinical phenotypes (higher QPA). We discovered the most prominent phenotypic similarities within mitochondrial protein complexes (<xref ref-type="fig" rid="pcbi-1000374-g002"><bold>Figure 2</bold></xref>) supporting previously predicted genotype-phenotype associations of protein complexes <xref ref-type="bibr" rid="pcbi.1000374-Lage1">[32]</xref>. However, we also noted complexes with lower phenotypic similarities (e.g. BCKDH - Maple syrup urine disease; GCC - Glycine encephalopathy) highlighting the importance for individual gene inspection. Since this analysis was limited to disease genes (DG), we were interested in learning the properties of a larger network that included non-disease candidate genes (CG). Utilizing the genome-wide study by Franke et al. <xref ref-type="bibr" rid="pcbi.1000374-Franke1">[34]</xref>, we created a functional network of more than 1.9 million gene interactions for 162 mitochondrial DG and 4,577 CG. Our analysis identified significant differences in functional interactions for DG and CG with a higher average connectivity for CG. This difference was detected for both the mitochondrial and non-mitochondrial gene groups (<xref ref-type="table" rid="pcbi-1000374-t002"><bold>Table 2</bold></xref>). In addition, while the total number of DG interactions was similar for DG and CG, the relative fraction of DG interactions (i[disease-genes]/i[all-genes]) was higher for DG indicating that DG are more likely to interact with each other. Previous smaller scale studies (∼100× fewer interactions) have predicted intermediate and peripheral positions of DG in gene functional networks with relatively fewer interactions than essential genes <xref ref-type="bibr" rid="pcbi.1000374-Goh1">[33]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Feldman1">[46]</xref>. Our results expand on this hypothesis showing that essential and non-disease genes (CG) can be distinguished from DG based on gene interaction patterns (<xref ref-type="fig" rid="pcbi-1000374-g003"><bold>Figure 3</bold></xref>). Furthermore, we also identified network properties differentiating mitochondrial from non-mitochondrial genes. Mitochondrial genes showed a lower average connectivity, which may be due to the double-membrane structure of the organelle limiting the detection of protein-protein interactions <xref ref-type="bibr" rid="pcbi.1000374-Prokisch2">[47]</xref>. However, the higher connectivity between mitochondrial genes may relativize this problem. Future studies will help to answer the question of the connectivity of mitochondrial genes and perhaps genes of other cellular compartments as well.</p>
<p>In the final part of this study we utilized the discovered interaction patterns to predict new mitochondrial DG. Using two different approaches, we identified 168 non-disease genes that resembled the characteristic interaction patterns of the 162 mitochondrial DG (estimated TP rate = 85.8%). If diseases are linked to a genomic interval, the predicted DG can be prioritized from a larger list of functional candidates for mutational screen in affected individuals (<xref ref-type="table" rid="pcbi-1000374-t003"><bold>Table 3</bold></xref>). For example, the optic atrophy 2 (OPA2) linkage interval contains seven mitochondrial genes that include three known DG of which HSD17B10 is associated with optic atrophy <xref ref-type="bibr" rid="pcbi.1000374-Ensenauer1">[48]</xref>–<xref ref-type="bibr" rid="pcbi.1000374-PerezCerda1">[50]</xref>, and three predicted DG of which two genes (NDUFB11, TIMM17B) interact with mitochondrial DG causing optic atrophy. Our phenome knowledgebase (<ext-link ext-link-type="uri" xlink:href="http://www.mitophenome.org" xlink:type="simple">www.mitophenome.org</ext-link>) can also be applied to investigate disorders through gene network association, in particular common conditions that are caused by single gene defects in a subset of patients <xref ref-type="bibr" rid="pcbi.1000374-Lim1">[51]</xref>. For example, a search for Parkinson disease returns 12 mitochondrial DG with interactions to 24 predicted DG (e.g. CCS, MECR, PRKAR2B). Similarly, seizures and mental retardation, a common combination of mitochondrial features, is caused by 59 DG that interact with 124 predicted DG. With the decreasing cost of DNA sequencing, high-throughput screens linking phenotypes with genotypes will further increase the accuracy of gene-feature associations. To this end, easy navigation between clinical phenotype and gene information promises to aid in the recognition and diagnosis of mitochondrial disorders.</p>
</sec><sec id="s4">
<title>Methods</title>
<sec id="s4a">
<title>Mitochondrial disease genes</title>
<p>We identified 174 disease genes that encode proteins targeted to mitochondria (<xref ref-type="supplementary-material" rid="pcbi.1000374.s004"><bold>Table S1</bold></xref>). While most gene defects are inherited as Mendelian traits; ACSL6, BAX, BCL2, ME2, MTHFD1, PARL, PHB, UCP1, and UCP2 are disease susceptibility alleles; DLST, OGDH, and PCK2 are disease-associated protein deficiencies; and HTRA2, MTCP1, SLC25A16, and WWOX cause disorders of unknown inheritance patterns. <xref ref-type="supplementary-material" rid="pcbi.1000374.s004"><bold>Table S1</bold></xref> has also the annotations and PMID references (col. I) for intracellular protein localizations and the 39 genes encoding components of nine mitochondrial protein complexes and pathways (col. J). Additional mitochondrial genes (<xref ref-type="supplementary-material" rid="pcbi.1000374.s009"><bold>Table S6</bold></xref>) were identified through integration of two studies <xref ref-type="bibr" rid="pcbi.1000374-Prokisch1">[5]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Calvo1">[36]</xref> that had combined predicted 1,200 mitochondrial genes.</p>
</sec><sec id="s4b">
<title>Phenotypic feature annotation</title>
<p>For each of the 174 disease genes, we identified individual studies and case reports describing a gene defect or deficiency and associated phenotype information. Manual extraction and annotation probably results in more specific and comprehensive data, with far fewer false-positives than automated alternatives including natural language processing and high-throughput screening <xref ref-type="bibr" rid="pcbi.1000374-Calvano1">[23]</xref>. Annotation of 1,636 full-text articles identified 461 phenotypic features that included the definition of specific clinical terms for each feature. Features were defined narrowly enough so that clinical diagnoses mapped to a single feature. This process was essential as phenotype descriptions were not consistent and often varied between different studies (see <xref ref-type="supplementary-material" rid="pcbi.1000374.s006"><bold>Table S3</bold></xref>, col. E). To define features, we utilized standardized descriptors in the Medical Subject Headings (MeSH) database under the “Diseases” (coded under C), and the “Psychiatry and Psychology” (coded under F) branches of the MeSH hierarchy used by the National Library of Medicine (NLM). Individual matching of features with MeSH descriptors revealed their positions in the hierarchical MeSH ontology, together with the parent descriptor, the directly related hypernym feature. For this analysis, we assigned each feature to only one position in MeSH (e.g. diabetes mellitus has MeSH positions C18.452.394.750 and C19.246; we chose the first category). We only added hypernyms to the ontology that were directly related to at least two features. Some features were added manually because they had no clear match with MeSH descriptors. By integrating our 461 features with their 41 hypernyms, we identified 502 features that are hierarchically classified within the mitochondrial phenotype ontology (<xref ref-type="supplementary-material" rid="pcbi.1000374.s005"><bold>Table S2</bold></xref>).</p>
</sec><sec id="s4c">
<title>Gene-feature pair annotation</title>
<p>We used 1,636 full-text articles to manually annotate 6,361 gene-feature pairs, each of which was created from at least one original PubMed article with a unique identifier (PMID). On average, we identified 2.77 PMID per gene-feature pair, and 9.87 PMID per gene. Further, we assigned each gene-feature pair to a unique OMIM disease record (e.g. 277900 for Wilson disease), which described the disorder and was referenced in many articles. We computationally integrated the 6,361 gene-feature pairs with our phenotype ontology, resulting in 10,202 gene-feature pairs (<xref ref-type="supplementary-material" rid="pcbi.1000374.s006"><bold>Table S3</bold></xref>). This integration also assigned the PMID of each gene-feature pair to its directly related hypernym gene-feature pair. PMID assigned through ontology integration are labeled “#” (col. G). Because gene-feature pairs may be associated with more than one OMIM disease record, we consolidated the 10,202 gene-feature pairs (and their PMID) into 9,407 unique pairs. For example, the gene POLG is associated with ophthalmoplegia and three OMIM disease records (157640, 258450, 607459).</p>
</sec><sec id="s4d">
<title>Quantitative phenotypic associations (QPA)</title>
<p>The association ratio for each gene-feature pair is the fraction of PMID reporting a specific feature for a specific gene out of the total number of PMID annotated for that gene. The feature Fi specific association ratio for gene pair A–B (rFi) was calculated as:<disp-formula><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.e001" xlink:type="simple"/></disp-formula>We considered the important weight wi of feature Fi for gene pair A–B as:<disp-formula><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.e002" xlink:type="simple"/></disp-formula>where N is the total number of genes (174) and df_i is the document frequency of feature Fi in all genes, which is related to the Inverse Document Frequency (IDF). IDF reflects the hypothesis that the value of a feature varies inversely with the number of genes in which it occurs <xref ref-type="bibr" rid="pcbi.1000374-Brunner1">[16]</xref>. To adjust for different PMID counts for a feature in different genes, we set a denominator as the maximum number of PMID in one gene associated with this feature. QPA integrated the association ratios (ri) in all features Fi (i = 1, 2, 3, …, I) for gene pair A–B through weights of wi_max which was calculated as:<disp-formula><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.e003" xlink:type="simple"/></disp-formula></p>
<p>We identified feature Fi specific association ratios for 514,978 gene pairs (self-pairs removed), and computed QPA for 27,938 gene pairs with numerical values between 0.00177 and 1 (<xref ref-type="supplementary-material" rid="pcbi.1000374.s007"><bold>Table S4</bold></xref>). An example of calculating QPA for specific disease genes is given under <xref ref-type="supplementary-material" rid="pcbi.1000374.s001"><bold>Text S1</bold></xref>. In a related analysis, we studied associations of genes and features after removing eleven features that describe biochemical measurements of protein complexes (e.g. AKDH-deficiency, RCC1-deficiency). Removing these features resulted in 9,298 gene-feature pairs. We identified high correlations for QPA using the 9,298 versus all 9,407 gene-feature pairs, respectively (Kendall Cor = 0.9899, Spearman Cor = 0.9981, and Pearson Cor = 0.9978). While biochemical measurements support the diagnosis of many mitochondrial diseases, these features may not be essential for QPA predictions.</p>
</sec><sec id="s4e">
<title>Correlation of QPA and gene functional interactions</title>
<p>We extracted 2,010 disease gene pairs (140 genes) from a recent study that had integrated microarray co-expression, human and orthologous protein-protein interactions, and Gene Ontology (GO) similarities into Likelihood Ratios (LR) for gene functional interactions <xref ref-type="bibr" rid="pcbi.1000374-Franke1">[34]</xref>. LR ranged from 1.1 to 2,374,581 and we used a linear transformation for LR to fall into a range between 0 and 1:<disp-formula><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.e004" xlink:type="simple"/></disp-formula></p>
<p>Overlapping all disease gene pairs with predictions for both LR and QPA revealed 1,928 pairs (<xref ref-type="supplementary-material" rid="pcbi.1000374.s007"><bold>Table S4</bold></xref>). Two-sided tests of uniform distribution of LR and QPA for these pairs revealed non-uniform distribution with p values of 2.2e-16 (significance level: 0.05). Rank correlation of LR and QPA for the 1,928 gene pairs showed positive association with significant confidence: Kendall (Cor = 0.077; p = 4.67e-7), Spearman (Cor = 0.115; p = 3.72e-7), and Pearson (Cor = 0.145; p = 1.59e-10). Bivariate analysis and Lowess plots further confirmed this finding (<xref ref-type="supplementary-material" rid="pcbi.1000374.s002"><bold>Figure S1</bold></xref>). In addition, we applied Euclidian distance and hierarchical average linkage clustering (<ext-link ext-link-type="uri" xlink:href="http://www.r-project.org" xlink:type="simple">http://www.r-project.org</ext-link>) and identified six gene clusters with higher to lower association of LR and QPA (<xref ref-type="supplementary-material" rid="pcbi.1000374.s003"><bold>Figure S2</bold></xref> and <xref ref-type="supplementary-material" rid="pcbi.1000374.s007"><bold>Table S4</bold></xref>).</p>
</sec><sec id="s4f">
<title>Functional interactions of nuclear-encoded mitochondrial genes</title>
<p>Out of the 174 DG, we identified functional interactions for 162 DG to 4,577 CG from a recent study <xref ref-type="bibr" rid="pcbi.1000374-Franke1">[34]</xref>. As for the 162 DG, we also recorded all genome-wide binary interactions for the 4,577 CG with a total of 1,949,132 interactions. All gene interactions are non-redundant and non-self-interacting. The interactions for the 4,577 CG included interactions to additional 5,358 genes that we labeled CG interactors (CGin). We assigned the following four attributes to the total 10,097 genes that included DG, CG and CGin (<xref ref-type="supplementary-material" rid="pcbi.1000374.s009"><bold>Table S6</bold></xref>): i. 1,283 disease genes identified through OMIM <xref ref-type="bibr" rid="pcbi.1000374-Hamosh1">[26]</xref>; ii. 1,032 human orthologs to mouse essential genes <xref ref-type="bibr" rid="pcbi.1000374-Goh1">[33]</xref>; iii. 977 human orthologs to yeast essential genes <xref ref-type="bibr" rid="pcbi.1000374-Giaever1">[37]</xref>; and iv. 863 nuclear-encoded mitochondrial genes through integrative analysis of two studies <xref ref-type="bibr" rid="pcbi.1000374-Prokisch1">[5]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Calvo1">[36]</xref>. We then computed for each DG (162) and CG (4,577) the total number of interactions (i[all-genes]), as well as all interactions to genes with the assigned attributes (i–iv). <xref ref-type="supplementary-material" rid="pcbi.1000374.s008"><bold>Table S5</bold></xref> lists all genome-wide interactions for the 4,739 genes (col. C) and interactions to genes with the four attributes (col. D–G).</p>
</sec><sec id="s4g">
<title>Functional interactions of non-mitochondrial genes</title>
<p>The analysis of interactions of the non-mitochondrial CG (3551) and DG (493) showed the following results: i. the total number of interactions (i[all-genes]), which is recorded to all genes in the human genome, was higher for CG than for DG (p = 3.67e-3); ii. the relative number of DG interactions (i[disease-genes]/i[all-genes]), which was recorded to all known human DG, was higher for DG than for CG (p = 1.07e-21); and iii. the relative number of interactions to human orthologs of mouse (i[mouse-essential]/i[all-genes]) and yeast (i[yeast-essential]/i[all-genes]) essential genes <xref ref-type="bibr" rid="pcbi.1000374-Goh1">[33]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Giaever1">[37]</xref> was higher for the DG than the CG (mouse p = 3.77e-4; yeast p = 7.62e-7).</p>
</sec><sec id="s4h">
<title>Gene fraction analysis</title>
<p>We studied the number of interactions (degree) of genes in the different gene groups and the probability distribution of these interactions (degree distribution) over the whole network. For each gene group, we computed the degree distributions P(k) as the fraction of the number of genes that interact with k other genes, where the sum of fractions of a specific gene group is 1. Similar to the study by Goh et al. <xref ref-type="bibr" rid="pcbi.1000374-Goh1">[33]</xref>, we used log2k as the dependent variable in <xref ref-type="fig" rid="pcbi-1000374-g003"><bold>Figure 3</bold></xref>. We calculated P(k) for interactions of each gene group to all human genes (<bold>3A</bold>), all human disease genes (<bold>3B</bold>) and all mitochondrial genes (<bold>3C</bold>) using data in <xref ref-type="supplementary-material" rid="pcbi.1000374.s008"><bold>Table S5</bold></xref>. We then performed a fraction analysis by applying the linear regression model to the degree distributions of each gene group and attribute using the R statistical package (<ext-link ext-link-type="uri" xlink:href="http://www.r-project.org" xlink:type="simple">http://www.r-project.org</ext-link>) and calculated the values for the regression line slopes, their p-values and correlation coefficients (<xref ref-type="supplementary-material" rid="pcbi.1000374.s010"><bold>Table S7</bold></xref>). We found that the measured trends described by the linear regression model are statistically significant for all gene groups with very small p-values (&lt;10<sup>−8</sup>), which we obtained by testing the null hypothesis that the slope is zero. The negative regression slopes identified for all gene groups suggested a relatively higher portion of less-connected genes and a lower tendency to form a hub structure. We then ordered the gene groups using their slope values. The order was based on the hypothesis that as larger the absolute value of the negative regression slope, the higher the probability that lower-connected genes outnumber the higher-connected genes. This comparison showed that in the interactions to all genes (<bold>3A</bold>), DG mito showed relatively fewer interactions (−0.00142) than CG mito (−0.00072), and in the interactions to all disease genes (<bold>3B</bold>), DG mito showed relatively more interactions (−0.00612) than CG mito (−0.00776). Similar relationships were found in the comparison of the mitochondrial gene groups based on their correlation coefficients (<xref ref-type="supplementary-material" rid="pcbi.1000374.s010"><bold>Table S7</bold></xref>). We concluded from these results that while mitochondrial disease genes displayed an overall smaller connectivity, they showed a tendency to interact with each other suggesting the formation of disease gene hubs in the periphery of the mitochondrial gene networks.</p>
</sec><sec id="s4i">
<title>Candidate genes for mitochondrial disorders</title>
<p>We applied the two supervised methods of discriminant analysis <xref ref-type="bibr" rid="pcbi.1000374-1">[43]</xref> and Bayesian network analysis <xref ref-type="bibr" rid="pcbi.1000374-httpwww.cs.waikato.ac.nzremcowekabn1">[44]</xref>,<xref ref-type="bibr" rid="pcbi.1000374-Witten1">[45]</xref> to predict new mitochondrial DG. From <xref ref-type="supplementary-material" rid="pcbi.1000374.s008"><bold>Table S5</bold></xref>, we selected 695 mitochondrial genes and their attributes of functional interactions and labeled the 162 DG as DG, the 495 CG as CG, and the 38 likely mitochondrial DG as CG to serve as controls. The linear discriminant covariance analysis was performed using the JMP statistical software with predictions results listed in <xref ref-type="supplementary-material" rid="pcbi.1000374.s011"><bold>Table S8</bold></xref> (col. D–I). For the Bayesian network analysis (col. K–P), we first selected 100 typical DG out of the 162 DG, and 100 typical CG out of the 495 CG (col. K). The 200 genes were imported as training sets into a machine-learning algorithm and the Bayesian network package of this program was used to train the model by the method of cross validation <xref ref-type="bibr" rid="pcbi.1000374-httpwww.cs.waikato.ac.nzremcowekabn1">[44]</xref>. We then imported the test set of all 695 mitochondrial genes in order to predict mitochondrial DG. The overlap of the two applied methods (col. Q) predicted 168 high-probability disease candidate genes out of the 495 non-disease CG.</p>
</sec><sec id="s4j">
<title>Author information</title>
<p>The accompanying mitochondrial phenome knowledgebase is available at <ext-link ext-link-type="uri" xlink:href="http://www.mitophenome.org" xlink:type="simple">http://www.mitophenome.org</ext-link></p>
</sec></sec><sec id="s5">
<title>Supporting Information</title>
<supplementary-material id="pcbi.1000374.s001" mimetype="application/msword" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s001" xlink:type="simple"><label>Text S1</label><caption>
<p>(0.03 MB DOC)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s002" mimetype="application/msword" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s002" xlink:type="simple"><label>Figure S1</label><caption>
<p>Lowess plot for the correlation of disease gene pairs predicted by LR and QPA.</p>
<p>(0.04 MB DOC)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s003" mimetype="application/msword" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s003" xlink:type="simple"><label>Figure S2</label><caption>
<p>Clustering of 1,928 disease gene-pairs with LR and QPA.</p>
<p>(0.08 MB DOC)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s004" mimetype="application/x-excel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s004" xlink:type="simple"><label>Table S1</label><caption>
<p>174 nuclear-encoded mitochondrial disease genes</p>
<p>(0.09 MB XLS)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s005" mimetype="application/x-excel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s005" xlink:type="simple"><label>Table S2</label><caption>
<p>502 phenotypic features in mitochondrial disease phenotype ontology</p>
<p>(0.06 MB XLS)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s006" mimetype="application/x-excel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s006" xlink:type="simple"><label>Table S3</label><caption>
<p>9,407 annotated gene-feature associations</p>
<p>(1.90 MB XLS)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s007" mimetype="application/x-excel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s007" xlink:type="simple"><label>Table S4</label><caption>
<p>27,938 QPA of disease gene pairs incl. 1,928 pairs with QPA and LR</p>
<p>(3.78 MB XLS)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s008" mimetype="application/x-excel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s008" xlink:type="simple"><label>Table S5</label><caption>
<p>4,739 genes in functional network analysis and their 5 interaction attributes</p>
<p>(0.54 MB XLS)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s009" mimetype="application/x-excel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s009" xlink:type="simple"><label>Table S6</label><caption>
<p>10,097 genes with LR interactions (DG, CG, and CG interactors)</p>
<p>(0.80 MB XLS)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s010" mimetype="application/x-excel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s010" xlink:type="simple"><label>Table S7</label><caption>
<p>Gene fraction analysis results</p>
<p>(0.01 MB XLS)</p>
</caption></supplementary-material><supplementary-material id="pcbi.1000374.s011" mimetype="application/x-excel" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1000374.s011" xlink:type="simple"><label>Table S8</label><caption>
<p>695 mitochondrial genes including newly predicted disease candidate genes.</p>
<p>(0.20 MB XLS)</p>
</caption></supplementary-material></sec></body>
<back>
<ack>
<p>We thank Lior David, Michael Mindrinos, and Uta Francke for questions and comments, Zhenglong Gu for aiding in the collaborations, Curtis Palm, Jengnan Tzeng, Tai-Been Chen, Chun-Jui Chen and Monika Trebo for help in preparing supplemental material, Marc Vidal and Kwang-Il Goh for providing mouse-lethal human orthologs, and Shayna Roosevelt for manuscript editing.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pcbi.1000374-Luft1"><label>1</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Luft</surname><given-names>R</given-names></name>
</person-group>             <year>1994</year>             <article-title>The development of mitochondrial medicine.</article-title>             <source>Proc Natl Acad Sci U S A</source>             <volume>91</volume>             <fpage>8731</fpage>             <lpage>8738</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-DiMauro1"><label>2</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>DiMauro</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Schon</surname><given-names>EA</given-names></name>
</person-group>             <year>1998</year>             <article-title>Nuclear power and mitochondrial disease.</article-title>             <source>Nature Genetics</source>             <volume>19</volume>             <fpage>214</fpage>             <lpage>215</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Wallace1"><label>3</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Wallace</surname><given-names>DC</given-names></name>
</person-group>             <year>2005</year>             <article-title>A mitochondrial paradigm of metabolic and degenerative diseases, aging, and cancer: a dawn for evolutionary medicine.</article-title>             <source>Annu Rev Genet</source>             <volume>39</volume>             <fpage>359</fpage>             <lpage>407</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Anderson1"><label>4</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Anderson</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Bankier</surname><given-names>AT</given-names></name>
<name name-style="western"><surname>Barrell</surname><given-names>BG</given-names></name>
<name name-style="western"><surname>de Bruijn</surname><given-names>MH</given-names></name>
<name name-style="western"><surname>Coulson</surname><given-names>AR</given-names></name>
<etal/></person-group>             <year>1981</year>             <article-title>Sequence and organization of the human mitochondrial genome.</article-title>             <source>Nature</source>             <volume>290</volume>             <fpage>457</fpage>             <lpage>465</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Prokisch1"><label>5</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Prokisch</surname><given-names>H</given-names></name>
<name name-style="western"><surname>Andreoli</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Ahting</surname><given-names>U</given-names></name>
<name name-style="western"><surname>Heiss</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Ruepp</surname><given-names>A</given-names></name>
<etal/></person-group>             <year>2006</year>             <article-title>MitoP2: the mitochondrial proteome database–now including mouse data.</article-title>             <source>Nucleic Acids Res</source>             <volume>34</volume>             <fpage>D705</fpage>             <lpage>711</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Chinnery1"><label>6</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Chinnery</surname><given-names>PF</given-names></name>
<name name-style="western"><surname>Turnbull</surname><given-names>DM</given-names></name>
</person-group>             <year>2001</year>             <article-title>Epidemiology and treatment of mitochondrial disorders.</article-title>             <source>Am J Med Genet</source>             <volume>106</volume>             <fpage>94</fpage>             <lpage>101</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Darin1"><label>7</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Darin</surname><given-names>N</given-names></name>
<name name-style="western"><surname>Oldfors</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Moslemi</surname><given-names>AR</given-names></name>
<name name-style="western"><surname>Holme</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Tulinius</surname><given-names>M</given-names></name>
</person-group>             <year>2001</year>             <article-title>The incidence of mitochondrial encephalomyopathies in childhood: clinical features and morphological, biochemical, and DNA anbormalities.</article-title>             <source>Ann Neurol</source>             <volume>49</volume>             <fpage>377</fpage>             <lpage>383</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Skladal1"><label>8</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Skladal</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Halliday</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Thorburn</surname><given-names>DR</given-names></name>
</person-group>             <year>2003</year>             <article-title>Minimum birth prevalence of mitochondrial respiratory chain disorders in children.</article-title>             <source>Brain</source>             <volume>126</volume>             <fpage>1905</fpage>             <lpage>1912</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Enns1"><label>9</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Enns</surname><given-names>GM</given-names></name>
</person-group>             <year>2003</year>             <article-title>The contribution of mitochondria to common disorders.</article-title>             <source>Mol Genet Metab</source>             <volume>80</volume>             <fpage>11</fpage>             <lpage>26</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Dawson1"><label>10</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Dawson</surname><given-names>TM</given-names></name>
<name name-style="western"><surname>Dawson</surname><given-names>VL</given-names></name>
</person-group>             <year>2003</year>             <article-title>Molecular pathways of neurodegeneration in Parkinson's disease.</article-title>             <source>Science</source>             <volume>302</volume>             <fpage>819</fpage>             <lpage>822</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Rosca1"><label>11</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Rosca</surname><given-names>MG</given-names></name>
<name name-style="western"><surname>Vazquez</surname><given-names>EJ</given-names></name>
<name name-style="western"><surname>Kerner</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Parland</surname><given-names>W</given-names></name>
<name name-style="western"><surname>Chandler</surname><given-names>MP</given-names></name>
<etal/></person-group>             <year>2008</year>             <article-title>Cardiac mitochondria in heart failure: decrease in respirasomes and oxidative phosphorylation.</article-title>             <source>Cardiovasc Res</source>             <volume>80</volume>             <fpage>30</fpage>             <lpage>39</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Lowell1"><label>12</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Lowell</surname><given-names>BB</given-names></name>
<name name-style="western"><surname>Shulman</surname><given-names>GI</given-names></name>
</person-group>             <year>2005</year>             <article-title>Mitochondrial dysfunction and type 2 diabetes.</article-title>             <source>Science</source>             <volume>307</volume>             <fpage>384</fpage>             <lpage>387</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Delsite1"><label>13</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Delsite</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Kachhap</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Anbazhagan</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Gabrielson</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Singh</surname><given-names>KK</given-names></name>
</person-group>             <year>2002</year>             <article-title>Nuclear genes involved in mitochondria-to-nucleus communication in breast cancer cells.</article-title>             <source>Mol Cancer</source>             <volume>1</volume>             <fpage>6</fpage>          </element-citation></ref>
<ref id="pcbi.1000374-Eng1"><label>14</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Eng</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Kiuru</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Fernandez</surname><given-names>MJ</given-names></name>
<name name-style="western"><surname>Aaltonen</surname><given-names>LA</given-names></name>
</person-group>             <year>2003</year>             <article-title>A role for mitochondrial enzymes in inherited neoplasia and beyond.</article-title>             <source>Nat Rev Cancer</source>             <volume>3</volume>             <fpage>193</fpage>             <lpage>202</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Freimer1"><label>15</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Freimer</surname><given-names>N</given-names></name>
<name name-style="western"><surname>Sabatti</surname><given-names>C</given-names></name>
</person-group>             <year>2003</year>             <article-title>The human phenome project.</article-title>             <source>Nat Genet</source>             <volume>34</volume>             <fpage>15</fpage>             <lpage>21</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Brunner1"><label>16</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Brunner</surname><given-names>HG</given-names></name>
<name name-style="western"><surname>van Driel</surname><given-names>MA</given-names></name>
</person-group>             <year>2004</year>             <article-title>From syndrome families to functional genomics.</article-title>             <source>Nat Rev Genet</source>             <volume>5</volume>             <fpage>545</fpage>             <lpage>551</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Biesecker1"><label>17</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Biesecker</surname><given-names>LG</given-names></name>
</person-group>             <year>2005</year>             <article-title>Mapping phenotypes to language: a proposal to organize and standardize the clinical descriptions of malformations.</article-title>             <source>Clin Genet</source>             <volume>68</volume>             <fpage>320</fpage>             <lpage>326</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Nadkarni1"><label>18</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Nadkarni</surname><given-names>PM</given-names></name>
</person-group>             <year>2003</year>             <article-title>The challenges of recording phenotype in a generalizable and computable form.</article-title>             <source>Pharmacogenomics J</source>             <volume>3</volume>             <fpage>8</fpage>             <lpage>10</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-vanDriel1"><label>19</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>van Driel</surname><given-names>MA</given-names></name>
<name name-style="western"><surname>Bruggeman</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Vriend</surname><given-names>G</given-names></name>
<name name-style="western"><surname>Brunner</surname><given-names>HG</given-names></name>
<name name-style="western"><surname>Leunissen</surname><given-names>JA</given-names></name>
</person-group>             <year>2006</year>             <article-title>A text-mining analysis of the human phenome.</article-title>             <source>Eur J Hum Genet</source>             <volume>14</volume>             <fpage>535</fpage>             <lpage>542</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Singer1"><label>20</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Singer</surname><given-names>E</given-names></name>
</person-group>             <year>2005</year>             <article-title>“Phenome” project set to pin down subgroups of autism.</article-title>             <source>Nat Med</source>             <volume>11</volume>             <fpage>583</fpage>          </element-citation></ref>
<ref id="pcbi.1000374-Potash1"><label>21</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Potash</surname><given-names>JB</given-names></name>
<name name-style="western"><surname>Toolan</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Steele</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Miller</surname><given-names>EB</given-names></name>
<name name-style="western"><surname>Pearl</surname><given-names>J</given-names></name>
<etal/></person-group>             <year>2007</year>             <article-title>The bipolar disorder phenome database: a resource for genetic studies.</article-title>             <source>Am J Psychiatry</source>             <volume>164</volume>             <fpage>1229</fpage>             <lpage>1237</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Sabb1"><label>22</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Sabb</surname><given-names>FW</given-names></name>
<name name-style="western"><surname>Bearden</surname><given-names>CE</given-names></name>
<name name-style="western"><surname>Glahn</surname><given-names>DC</given-names></name>
<name name-style="western"><surname>Parker</surname><given-names>DS</given-names></name>
<name name-style="western"><surname>Freimer</surname><given-names>N</given-names></name>
<etal/></person-group>             <year>2008</year>             <article-title>A collaborative knowledge base for cognitive phenomics.</article-title>             <source>Mol Psychiatry</source>             <volume>13</volume>             <fpage>350</fpage>             <lpage>360</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Calvano1"><label>23</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Calvano</surname><given-names>SE</given-names></name>
<name name-style="western"><surname>Xiao</surname><given-names>W</given-names></name>
<name name-style="western"><surname>Richards</surname><given-names>DR</given-names></name>
<name name-style="western"><surname>Felciano</surname><given-names>RM</given-names></name>
<name name-style="western"><surname>Baker</surname><given-names>HV</given-names></name>
<etal/></person-group>             <year>2005</year>             <article-title>A network-based analysis of systemic inflammation in humans.</article-title>             <source>Nature</source>             <volume>437</volume>             <fpage>1032</fpage>             <lpage>1037</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-HernandezBoussard1"><label>24</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Hernandez-Boussard</surname><given-names>T</given-names></name>
<name name-style="western"><surname>Whirl-Carrillo</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Hebert</surname><given-names>JM</given-names></name>
<name name-style="western"><surname>Gong</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Owen</surname><given-names>R</given-names></name>
<etal/></person-group>             <year>2008</year>             <article-title>The pharmacogenetics and pharmacogenomics knowledge base: accentuating the knowledge.</article-title>             <source>Nucleic Acids Res</source>             <volume>36</volume>             <fpage>D913</fpage>             <lpage>918</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Vo1"><label>25</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Vo</surname><given-names>TD</given-names></name>
<name name-style="western"><surname>Palsson</surname><given-names>BO</given-names></name>
</person-group>             <year>2007</year>             <article-title>Building the power house: recent advances in mitochondrial studies through proteomics and systems biology.</article-title>             <source>Am J Physiol Cell Physiol</source>             <volume>292</volume>             <fpage>C164</fpage>             <lpage>177</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Hamosh1"><label>26</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Hamosh</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Scott</surname><given-names>AF</given-names></name>
<name name-style="western"><surname>Amberger</surname><given-names>JS</given-names></name>
<name name-style="western"><surname>Bocchini</surname><given-names>CA</given-names></name>
<name name-style="western"><surname>McKusick</surname><given-names>VA</given-names></name>
</person-group>             <year>2005</year>             <article-title>Online Mendelian Inheritance in Man (OMIM), a knowledgebase of human genes and genetic disorders.</article-title>             <source>Nucleic Acids Res</source>             <volume>33 Database Issue</volume>             <fpage>D514</fpage>             <lpage>517</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-httpwww.nlm.nih.govmeshmeshhome.html1"><label>27</label><element-citation publication-type="other" xlink:type="simple">             <comment><ext-link ext-link-type="uri" xlink:href="http://www.nlm.nih.gov/mesh/meshhome.html" xlink:type="simple">http://www.nlm.nih.gov/mesh/meshhome.html</ext-link> Medical Subjects Heading Database</comment>          </element-citation></ref>
<ref id="pcbi.1000374-Holliday1"><label>28</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Holliday</surname><given-names>MA</given-names></name>
</person-group>             <year>1971</year>             <article-title>Metabolic rate and organ size during growth from infancy to maturity and during late gastation and early infancy.</article-title>             <source>Pediatrics</source>             <volume>47</volume><supplement>Suppl 2</supplement>             <fpage>169+</fpage>          </element-citation></ref>
<ref id="pcbi.1000374-Benard1"><label>29</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Benard</surname><given-names>G</given-names></name>
<name name-style="western"><surname>Faustin</surname><given-names>B</given-names></name>
<name name-style="western"><surname>Passerieux</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Galinier</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Rocher</surname><given-names>C</given-names></name>
<etal/></person-group>             <year>2006</year>             <article-title>Physiological diversity of mitochondrial oxidative phosphorylation.</article-title>             <source>Am J Physiol Cell Physiol</source>             <volume>291</volume>             <fpage>C1172</fpage>             <lpage>1182</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Storey1"><label>30</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Storey</surname><given-names>JD</given-names></name>
<name name-style="western"><surname>Madeoy</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Strout</surname><given-names>JL</given-names></name>
<name name-style="western"><surname>Wurfel</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Ronald</surname><given-names>J</given-names></name>
<etal/></person-group>             <year>2007</year>             <article-title>Gene-expression variation within and among human populations.</article-title>             <source>Am J Hum Genet</source>             <volume>80</volume>             <fpage>502</fpage>             <lpage>509</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Butte1"><label>31</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Butte</surname><given-names>AJ</given-names></name>
<name name-style="western"><surname>Kohane</surname><given-names>IS</given-names></name>
</person-group>             <year>2006</year>             <article-title>Creation and implications of a phenome-genome network.</article-title>             <source>Nat Biotechnol</source>             <volume>24</volume>             <fpage>55</fpage>             <lpage>62</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Lage1"><label>32</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Lage</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Karlberg</surname><given-names>EO</given-names></name>
<name name-style="western"><surname>Storling</surname><given-names>ZM</given-names></name>
<name name-style="western"><surname>Olason</surname><given-names>PI</given-names></name>
<name name-style="western"><surname>Pedersen</surname><given-names>AG</given-names></name>
<etal/></person-group>             <year>2007</year>             <article-title>A human phenome-interactome network of protein complexes implicated in genetic disorders.</article-title>             <source>Nat Biotechnol</source>             <volume>25</volume>             <fpage>309</fpage>             <lpage>316</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Goh1"><label>33</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Goh</surname><given-names>KI</given-names></name>
<name name-style="western"><surname>Cusick</surname><given-names>ME</given-names></name>
<name name-style="western"><surname>Valle</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Childs</surname><given-names>B</given-names></name>
<name name-style="western"><surname>Vidal</surname><given-names>M</given-names></name>
<etal/></person-group>             <year>2007</year>             <article-title>The human disease network.</article-title>             <source>Proc Natl Acad Sci U S A</source>             <volume>104</volume>             <fpage>8685</fpage>             <lpage>8690</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Franke1"><label>34</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Franke</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Bakel</surname><given-names>H</given-names></name>
<name name-style="western"><surname>Fokkens</surname><given-names>L</given-names></name>
<name name-style="western"><surname>de Jong</surname><given-names>ED</given-names></name>
<name name-style="western"><surname>Egmont-Petersen</surname><given-names>M</given-names></name>
<etal/></person-group>             <year>2006</year>             <article-title>Reconstruction of a functional human gene network, with an application for prioritizing positional candidate genes.</article-title>             <source>Am J Hum Genet</source>             <volume>78</volume>             <fpage>1011</fpage>             <lpage>1025</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Braun1"><label>35</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Braun</surname><given-names>P</given-names></name>
<name name-style="western"><surname>Rietman</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Vidal</surname><given-names>M</given-names></name>
</person-group>             <year>2008</year>             <article-title>Networking metabolites and diseases.</article-title>             <source>Proc Natl Acad Sci U S A</source>             <volume>105</volume>             <fpage>9849</fpage>             <lpage>9850</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Calvo1"><label>36</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Calvo</surname><given-names>S</given-names></name>
<name name-style="western"><surname>Jain</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Xie</surname><given-names>X</given-names></name>
<name name-style="western"><surname>Sheth</surname><given-names>SA</given-names></name>
<name name-style="western"><surname>Chang</surname><given-names>B</given-names></name>
<etal/></person-group>             <year>2006</year>             <article-title>Systematic identification of human mitochondrial disease genes through integrative genomics.</article-title>             <source>Nat Genet</source>             <volume>38</volume>             <fpage>576</fpage>             <lpage>582</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Giaever1"><label>37</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Giaever</surname><given-names>G</given-names></name>
<name name-style="western"><surname>Chu</surname><given-names>AM</given-names></name>
<name name-style="western"><surname>Ni</surname><given-names>L</given-names></name>
<name name-style="western"><surname>Connelly</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Riles</surname><given-names>L</given-names></name>
<etal/></person-group>             <year>2002</year>             <article-title>Functional profiling of the Saccharomyces cerevisiae genome.</article-title>             <source>Nature</source>             <volume>418</volume>             <fpage>387</fpage>             <lpage>391</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Tiranti1"><label>38</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Tiranti</surname><given-names>V</given-names></name>
<name name-style="western"><surname>Hoertnagel</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Carrozzo</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Galimberti</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Munaro</surname><given-names>M</given-names></name>
<etal/></person-group>             <year>1998</year>             <article-title>Mutations of SURF-1 in Leigh disease associated with cytochrome c oxidase deficiency.</article-title>             <source>Am J Hum Genet</source>             <volume>63</volume>             <fpage>1609</fpage>             <lpage>1621</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Steinmetz1"><label>39</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Steinmetz</surname><given-names>LM</given-names></name>
<name name-style="western"><surname>Scharfe</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Deutschbauer</surname><given-names>AM</given-names></name>
<name name-style="western"><surname>Mokranjac</surname><given-names>D</given-names></name>
<name name-style="western"><surname>Herman</surname><given-names>ZS</given-names></name>
<etal/></person-group>             <year>2002</year>             <article-title>Systematic screen for human disease genes in yeast.</article-title>             <source>Nat Genet</source>             <volume>31</volume>             <fpage>400</fpage>             <lpage>404</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Mootha1"><label>40</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Mootha</surname><given-names>VK</given-names></name>
<name name-style="western"><surname>Lepage</surname><given-names>P</given-names></name>
<name name-style="western"><surname>Miller</surname><given-names>K</given-names></name>
<name name-style="western"><surname>Bunkenborg</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Reich</surname><given-names>M</given-names></name>
<etal/></person-group>             <year>2003</year>             <article-title>Identification of a gene causing human cytochrome c oxidase deficiency by integrative genomics.</article-title>             <source>Proc Natl Acad Sci U S A</source>             <volume>100</volume>             <fpage>605</fpage>             <lpage>610</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Elpeleg1"><label>41</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Elpeleg</surname><given-names>O</given-names></name>
<name name-style="western"><surname>Miller</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Hershkovitz</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Bitner-Glindzicz</surname><given-names>M</given-names></name>
<name name-style="western"><surname>Bondi-Rubinstein</surname><given-names>G</given-names></name>
<etal/></person-group>             <year>2005</year>             <article-title>Deficiency of the ADP-forming succinyl-CoA synthase activity is associated with encephalomyopathy and mitochondrial DNA depletion.</article-title>             <source>Am J Hum Genet</source>             <volume>76</volume>             <fpage>1081</fpage>             <lpage>1086</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Spinazzola1"><label>42</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Spinazzola</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Viscomi</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Fernandez-Vizarra</surname><given-names>E</given-names></name>
<name name-style="western"><surname>Carrara</surname><given-names>F</given-names></name>
<name name-style="western"><surname>D'Adamo</surname><given-names>P</given-names></name>
<etal/></person-group>             <year>2006</year>             <article-title>MPV17 encodes an inner mitochondrial membrane protein and is mutated in infantile hepatic mitochondrial DNA depletion.</article-title>             <source>Nat Genet</source>             <volume>38</volume>             <fpage>570</fpage>             <lpage>575</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-1"><label>43</label><element-citation publication-type="other" xlink:type="simple">             <source>JMP Version 7</source>             <publisher-loc>Cary, NC</publisher-loc>             <publisher-name>SAS Institute Inc.</publisher-name>             <comment>1989–2007</comment>          </element-citation></ref>
<ref id="pcbi.1000374-httpwww.cs.waikato.ac.nzremcowekabn1"><label>44</label><element-citation publication-type="other" xlink:type="simple">             <comment><ext-link ext-link-type="uri" xlink:href="http://www.cs.waikato.ac.nz/~remco/weka_bn/" xlink:type="simple">http://www.cs.waikato.ac.nz/̃remco/weka_bn/</ext-link> WEKA Bayesian Network Classifier</comment>          </element-citation></ref>
<ref id="pcbi.1000374-Witten1"><label>45</label><element-citation publication-type="other" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Witten</surname><given-names>IH</given-names></name>
<name name-style="western"><surname>Frank</surname><given-names>E</given-names></name>
</person-group>             <year>2005</year>             <source>Data mining : practical machine learning tools and techniques</source>             <publisher-loc>Amsterdam; Boston, MA</publisher-loc>             <publisher-name>Morgan Kaufman</publisher-name>             <fpage>xxxi, 525</fpage>          </element-citation></ref>
<ref id="pcbi.1000374-Feldman1"><label>46</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Feldman</surname><given-names>I</given-names></name>
<name name-style="western"><surname>Rzhetsky</surname><given-names>A</given-names></name>
<name name-style="western"><surname>Vitkup</surname><given-names>D</given-names></name>
</person-group>             <year>2008</year>             <article-title>Network properties of genes harboring inherited disease mutations.</article-title>             <source>Proc Natl Acad Sci U S A</source>             <volume>105</volume>             <fpage>4323</fpage>             <lpage>4328</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Prokisch2"><label>47</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Prokisch</surname><given-names>H</given-names></name>
<name name-style="western"><surname>Scharfe</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Camp</surname><given-names>DG</given-names><suffix>2nd</suffix></name>
<name name-style="western"><surname>Xiao</surname><given-names>W</given-names></name>
<name name-style="western"><surname>David</surname><given-names>L</given-names></name>
<etal/></person-group>             <year>2004</year>             <article-title>Integrative analysis of the mitochondrial proteome in yeast.</article-title>             <source>PLoS Biol</source>             <volume>2</volume>             <fpage>e160</fpage>             <comment>doi:10.1371/journal.pbio.0020160</comment>          </element-citation></ref>
<ref id="pcbi.1000374-Ensenauer1"><label>48</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Ensenauer</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Niederhoff</surname><given-names>H</given-names></name>
<name name-style="western"><surname>Ruiter</surname><given-names>JP</given-names></name>
<name name-style="western"><surname>Wanders</surname><given-names>RJ</given-names></name>
<name name-style="western"><surname>Schwab</surname><given-names>KO</given-names></name>
<etal/></person-group>             <year>2002</year>             <article-title>Clinical variability in 3-hydroxy-2-methylbutyryl-CoA dehydrogenase deficiency.</article-title>             <source>Ann Neurol</source>             <volume>51</volume>             <fpage>656</fpage>             <lpage>659</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Sass1"><label>49</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Sass</surname><given-names>JO</given-names></name>
<name name-style="western"><surname>Forstner</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Sperl</surname><given-names>W</given-names></name>
</person-group>             <year>2004</year>             <article-title>2-Methyl-3-hydroxybutyryl-CoA dehydrogenase deficiency: impaired catabolism of isoleucine presenting as neurodegenerative disease.</article-title>             <source>Brain Dev</source>             <volume>26</volume>             <fpage>12</fpage>             <lpage>14</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-PerezCerda1"><label>50</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Perez-Cerda</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Garcia-Villoria</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Ofman</surname><given-names>R</given-names></name>
<name name-style="western"><surname>Sala</surname><given-names>PR</given-names></name>
<name name-style="western"><surname>Merinero</surname><given-names>B</given-names></name>
<etal/></person-group>             <year>2005</year>             <article-title>2-Methyl-3-hydroxybutyryl-CoA dehydrogenase (MHBD) deficiency: an X-linked inborn error of isoleucine metabolism that may mimic a mitochondrial disease.</article-title>             <source>Pediatr Res</source>             <volume>58</volume>             <fpage>488</fpage>             <lpage>491</lpage>          </element-citation></ref>
<ref id="pcbi.1000374-Lim1"><label>51</label><element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author">
<name name-style="western"><surname>Lim</surname><given-names>J</given-names></name>
<name name-style="western"><surname>Hao</surname><given-names>T</given-names></name>
<name name-style="western"><surname>Shaw</surname><given-names>C</given-names></name>
<name name-style="western"><surname>Patel</surname><given-names>AJ</given-names></name>
<name name-style="western"><surname>Szabo</surname><given-names>G</given-names></name>
<etal/></person-group>             <year>2006</year>             <article-title>A protein-protein interaction network for human inherited ataxias and disorders of Purkinje cell degeneration.</article-title>             <source>Cell</source>             <volume>125</volume>             <fpage>801</fpage>             <lpage>814</lpage>          </element-citation></ref>
</ref-list>

</back>
</article>