<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS Comput Biol</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">ploscomp</journal-id>
<journal-title-group>
<journal-title>PLOS Computational Biology</journal-title>
</journal-title-group>
<issn pub-type="ppub">1553-734X</issn>
<issn pub-type="epub">1553-7358</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PCOMPBIOL-D-17-00624</article-id>
<article-id pub-id-type="doi">10.1371/journal.pcbi.1005694</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Computer and information sciences</subject><subj-group><subject>Network analysis</subject><subj-group><subject>Protein interaction networks</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Biochemistry</subject><subj-group><subject>Proteomics</subject><subj-group><subject>Protein interaction networks</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Physical sciences</subject><subj-group><subject>Mathematics</subject><subj-group><subject>Applied mathematics</subject><subj-group><subject>Algorithms</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Simulation and modeling</subject><subj-group><subject>Algorithms</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Biochemistry</subject><subj-group><subject>Proteins</subject><subj-group><subject>Protein interactions</subject><subj-group><subject>Protein-protein interactions</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Ecology</subject><subj-group><subject>Ecosystems</subject><subj-group><subject>Forests</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Ecology and environmental sciences</subject><subj-group><subject>Ecology</subject><subj-group><subject>Ecosystems</subject><subj-group><subject>Forests</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Ecology and environmental 
sciences</subject><subj-group><subject>Terrestrial environments</subject><subj-group><subject>Forests</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Computer and information sciences</subject><subj-group><subject>Network analysis</subject></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Oncology</subject><subj-group><subject>Cancers and neoplasms</subject><subj-group><subject>Lung and intrathoracic tumors</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Database and informatics methods</subject><subj-group><subject>Biological databases</subject><subj-group><subject>Proteomic databases</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Biochemistry</subject><subj-group><subject>Proteomics</subject><subj-group><subject>Proteomic databases</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Database and informatics methods</subject><subj-group><subject>Bioinformatics</subject></subj-group></subj-group></subj-group></article-categories>
<title-group>
<article-title>PCSF: An R-package for network-based interpretation of high-throughput data</article-title>
<alt-title alt-title-type="running-head">PCSF: An R-package for network-based interpretation of high-throughput data</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Akhmedov</surname> <given-names>Murodzhon</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Formal analysis</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Visualization</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-6156-5046</contrib-id>
<name name-style="western">
<surname>Kedaigle</surname> <given-names>Amanda</given-names></name>
<role content-type="http://credit.casrai.org/">Data curation</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-6913-4910</contrib-id>
<name name-style="western">
<surname>Chong</surname> <given-names>Renan Escalante</given-names></name>
<role content-type="http://credit.casrai.org/">Visualization</role>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
<xref ref-type="fn" rid="currentaff001"><sup>¤</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-0229-0465</contrib-id>
<name name-style="western">
<surname>Montemanni</surname> <given-names>Roberto</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-5637-8983</contrib-id>
<name name-style="western">
<surname>Bertoni</surname> <given-names>Francesco</given-names></name>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Resources</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-9249-8181</contrib-id>
<name name-style="western">
<surname>Fraenkel</surname> <given-names>Ernest</given-names></name>
<role content-type="http://credit.casrai.org/">Data curation</role>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Resources</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-2751-4218</contrib-id>
<name name-style="western">
<surname>Kwee</surname> <given-names>Ivo</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Funding acquisition</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
</contrib-group>
<aff id="aff001">
<label>1</label>
<addr-line>Dalle Molle Institute for Artificial Intelligence Research (USI/SUPSI), Manno, Switzerland</addr-line>
</aff>
<aff id="aff002">
<label>2</label>
<addr-line>Institute of Oncology Research (IOR), Bellinzona, Switzerland</addr-line>
</aff>
<aff id="aff003">
<label>3</label>
<addr-line>Swiss Institute of Bioinformatics (SIB), Lausanne, Switzerland</addr-line>
</aff>
<aff id="aff004">
<label>4</label>
<addr-line>Department of Biological Engineering, MIT, Cambridge, Massachusetts, United States of America</addr-line>
</aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Schneidman</surname> <given-names>Dina</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1">
<addr-line>Hebrew University of Jerusalem, ISRAEL</addr-line>
</aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<fn fn-type="current-aff" id="currentaff001">
<label>¤</label><p>Current address: Systems Biology, Associate Director, Immuneering Corporation, Cambridge, Massachusetts, United States of America</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">fraenkel@mit.edu</email> (EF); <email xlink:type="simple">ivo.kwee@ior.iosi.ch</email>, <email xlink:type="simple">ivo.kwee@gmail.com</email> (IK)</corresp>
</author-notes>
<pub-date pub-type="collection">
<month>7</month>
<year>2017</year>
</pub-date>
<pub-date pub-type="epub">
<day>31</day>
<month>7</month>
<year>2017</year>
</pub-date>
<volume>13</volume>
<issue>7</issue>
<elocation-id>e1005694</elocation-id>
<history>
<date date-type="received">
<day>3</day>
<month>5</month>
<year>2017</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>7</month>
<year>2017</year>
</date>
</history>
<permissions>
<copyright-year>2017</copyright-year>
<copyright-holder>Akhmedov et al</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pcbi.1005694"/>
<abstract>
<p>With recent technological developments, a vast amount of high-throughput data has been profiled to understand the mechanisms of complex diseases. The current bioinformatics challenge is to interpret the data and underlying biology, where efficient algorithms for analyzing heterogeneous high-throughput data using biological networks are becoming increasingly valuable. In this paper, we propose a software package based on the Prize-collecting Steiner Forest graph optimization approach. The PCSF package performs fast and user-friendly network analysis of high-throughput data by mapping the data onto biological networks such as protein-protein interaction, gene-gene interaction, or any other correlation- or coexpression-based networks. Using the interaction networks as a template, it determines high-confidence subnetworks relevant to the data, which potentially leads to predictions of functional units. It also interactively visualizes the resulting subnetwork with functional enrichment analysis.</p>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/501100001711</institution-id>
<institution>Schweizerischer Nationalfonds zur Förderung der Wissenschaftlichen Forschung</institution>
</institution-wrap>
</funding-source>
<award-id>205321-147138/1</award-id>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-2751-4218</contrib-id>
<name name-style="western">
<surname>Kwee</surname> <given-names>Ivo</given-names></name>
</principal-award-recipient>
</award-group>
<award-group id="award002">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/100000002</institution-id>
<institution>National Institutes of Health</institution>
</institution-wrap>
</funding-source>
<award-id>U54-NS-091046</award-id>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-9249-8181</contrib-id>
<name name-style="western">
<surname>Fraenkel</surname> <given-names>Ernest</given-names></name>
</principal-award-recipient>
</award-group>
<award-group id="award003">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/100000002</institution-id>
<institution>National Institutes of Health</institution>
</institution-wrap>
</funding-source>
<award-id>U01-CA-184898</award-id>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-9249-8181</contrib-id>
<name name-style="western">
<surname>Fraenkel</surname> <given-names>Ernest</given-names></name>
</principal-award-recipient>
</award-group>
<funding-statement>MA was supported by the Swiss National Science Foundation (205321-147138/1, <ext-link ext-link-type="uri" xlink:href="http://www.snf.ch" xlink:type="simple">www.snf.ch</ext-link>). MA (partially) and AK were supported by the National Institutes of Health (U54-NS-091046 and U01-CA-184898, <ext-link ext-link-type="uri" xlink:href="http://www.nih.gov" xlink:type="simple">www.nih.gov</ext-link>). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement>
</funding-group>
<counts>
<fig-count count="1"/>
<table-count count="1"/>
<page-count count="7"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>PLOS Publication Stage</meta-name>
<meta-value>vor-update-to-uncorrected-proof</meta-value>
</custom-meta>
<custom-meta>
<meta-name>Publication Update</meta-name>
<meta-value>2017-08-10</meta-value>
</custom-meta>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>The package and tutorials are available on GitHub at <ext-link ext-link-type="uri" xlink:href="https://github.com/IOR-Bioinformatics/PCSF" xlink:type="simple">https://github.com/IOR-Bioinformatics/PCSF</ext-link>.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<disp-quote><p>This is a <italic>PLOS Computational Biology</italic> Software paper.</p></disp-quote>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>A tremendous quantity of high-throughput data at multiple layers of cellular systems has been profiled to study biological responses to perturbations and diseases. The current challenge is to develop methods for effective analysis of these data to better interpret underlying biology and identify functional units. Network modeling approaches are some of the techniques lately used for analysis of biological networks [<xref ref-type="bibr" rid="pcbi.1005694.ref001">1</xref>, <xref ref-type="bibr" rid="pcbi.1005694.ref002">2</xref>]. Recently, the Prize-collecting Steiner Forest (PCSF) algorithm has been applied to interaction networks to find a subnetwork enriched for input data, which corresponds to relevant subunits in the interactome of a cell [<xref ref-type="bibr" rid="pcbi.1005694.ref003">3</xref>, <xref ref-type="bibr" rid="pcbi.1005694.ref004">4</xref>].</p>
<p>The PCSF problem has NP-hard characteristics, and it requires a great deal of effort to find exact solutions on larger biological networks. Recently, we have developed a fast heuristic for the PCSF [<xref ref-type="bibr" rid="pcbi.1005694.ref005">5</xref>], and conducted a detailed performance comparison with existing methods [<xref ref-type="bibr" rid="pcbi.1005694.ref006">6</xref>]. As an extension to this, we present an R package that performs fast and user-friendly analysis of high-throughput data using the interaction networks as a template, and interprets the biological landscape of the interactome with respect to the data. More specifically, the PCSF package allows the user to i) upload the interactome and patient data, ii) compute the PCSF subnetwork solution, iii) perform functional analysis on the resulting subnetwork, and iv) interactively visualize the final subnetwork with functional enrichment information.</p>
</sec>
<sec id="sec002" sec-type="materials|methods">
<title>Design and implementation</title>
<sec id="sec003">
<title>The PCSF methodology</title>
<p>The PCSF is a well-known problem in graph theory. Given an undirected graph <italic>G</italic> = (<italic>V</italic>, <italic>E</italic>), where the vertices are labeled with prizes <italic>p</italic><sub><italic>v</italic></sub> and the edges are labeled with costs <italic>c</italic><sub><italic>e</italic></sub> &gt; 0, the goal is to identify a subnetwork <italic>G</italic>′ = (<italic>V</italic>′, <italic>E</italic>′) with a forest structure. The target is to minimize the total edge costs in <italic>E</italic>′, the total node prizes left out of <italic>V</italic>′, and the number of trees in <italic>G</italic>′. This is equivalent to minimization of the following objective function:
<disp-formula id="pcbi.1005694.e001"><alternatives><graphic id="pcbi.1005694.e001g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1005694.e001" xlink:type="simple"/><mml:math display="block" id="M1"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>F</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mi>G</mml:mi> <mml:mo>′</mml:mo></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>=</mml:mo> <mml:mtext>Minimize</mml:mtext> <mml:munder><mml:mo>∑</mml:mo> <mml:mrow><mml:mi>e</mml:mi> <mml:mo>∈</mml:mo> <mml:msup><mml:mi>E</mml:mi> <mml:mo>′</mml:mo></mml:msup></mml:mrow></mml:munder> <mml:msub><mml:mi>c</mml:mi> <mml:mi>e</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:mi>β</mml:mi> <mml:mo>·</mml:mo> <mml:munder><mml:mo>∑</mml:mo> <mml:mrow><mml:mi>v</mml:mi> <mml:mo>∉</mml:mo> <mml:msup><mml:mi>V</mml:mi> <mml:mo>′</mml:mo></mml:msup></mml:mrow></mml:munder> <mml:msub><mml:mi>p</mml:mi> <mml:mi>v</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:mi>ω</mml:mi> <mml:mo>·</mml:mo> <mml:mi>k</mml:mi></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(1)</label></disp-formula>
where <italic>k</italic> is the number of trees in the forest, which is regulated by the parameter <italic>ω</italic>. The parameter <italic>β</italic> is used to tune the prizes of nodes relative to edge costs.</p>
<p>Recently, we have applied PCSF to biological networks in the Forest module of the Omics Integrator software [<xref ref-type="bibr" rid="pcbi.1005694.ref004">4</xref>]. In biological networks such as protein-protein interaction (PPI) networks, every vertex represents a biomolecule, and every edge corresponds to the cellular interaction between two biomolecules. Edges of the network are given costs which correspond to the confidence or frequency of that interaction. The vertices of the network are given prizes according to the measurements of differential expression, copy number, or number of mutations for that gene or protein. The vertices that are assigned a prize are referred to as <italic>terminal</italic> nodes. Non-terminal nodes, which were not observed in the experimental data, may appear in the solution and are called <italic>Steiner</italic> nodes. After scoring the interactome, the PCSF is used to detect a relevant subnetwork (forest). The PCSF aims to identify neighborhoods in interaction networks potentially belonging to the key dysregulated pathways of a disease or experiment.</p>
<p>In order to avoid a bias for the hub nodes of PPI networks to appear in the PCSF solution, we use the method introduced in Forest [<xref ref-type="bibr" rid="pcbi.1005694.ref004">4</xref>], which penalizes the prizes of nodes according to their degree in the PPI network. Within the implementation, we use the parameter <italic>μ</italic> to fine-tune the penalties as:
<disp-formula id="pcbi.1005694.e002"><alternatives><graphic id="pcbi.1005694.e002g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pcbi.1005694.e002" xlink:type="simple"/><mml:math display="block" id="M2"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msubsup><mml:mi>p</mml:mi> <mml:mi>v</mml:mi> <mml:mo>′</mml:mo></mml:msubsup> <mml:mo>=</mml:mo> <mml:msub><mml:mi>p</mml:mi> <mml:mi>v</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:mi>μ</mml:mi> <mml:mo>*</mml:mo> <mml:mtext>degree</mml:mtext> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>v</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>.</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(2)</label></disp-formula>
The parameter <italic>μ</italic> also affects the total number of <italic>Steiner</italic> nodes in the solution. The higher the value of <italic>μ</italic>, the smaller the number of <italic>Steiner</italic> nodes in the subnetwork, and vice-versa. The recommended range of <italic>μ</italic> for biological networks is between 1e-4 and 5e-2 to fine-tune the <italic>Steiner</italic>/<italic>terminal</italic> node ratio in the subnetwork and average <italic>Steiner</italic>/<italic>terminal</italic> in-degree ratio of the corresponding nodes in the original template network.</p>
</sec>
<sec id="sec004">
<title>Implementation, dependencies, and installation</title>
<p>The software was implemented in the R environment and can easily be installed within the R terminal. As input, the package requires a template network such as a protein-protein interaction, protein-metabolite interaction, or any other correlation-based interaction network, and it maps differentially expressed genes/proteins/metabolites from the high-throughput data as vertex prizes into the template network. Then, it computes and returns high-scoring neighborhoods to identify functional modules in the interactome. Required parameters are: <italic>β</italic>—for tuning the vertex prizes, <italic>ω</italic>—for regulating the number of distinct components in the subnetwork, and <italic>μ</italic>—for hub penalization.</p>
<p>The package has the following R-package dependencies:</p>
<list list-type="bullet">
<list-item>
<p>BH and igraph—for efficient graph handling and calculations,</p>
</list-item>
<list-item>
<p>httr, methods, org.Hs.eg.db, and topGO—for enrichment analysis,</p>
</list-item>
<list-item>
<p>Rcpp—to employ C++ source code within R,</p>
</list-item>
<list-item>
<p>visNetwork—for visualization.</p>
</list-item>
</list>
<p>The dependencies are automatically installed along with the PCSF package. For more details about the package dependencies and installation, we refer the reader to the supplementary documents.</p>
</sec>
<sec id="sec005">
<title>The software test</title>
<p>The software was successfully installed and tested in the following environments: Mac OS X (10.12.4) R 3.4.0, Ubuntu (16.04) R 3.2.3, Windows 7 R 3.4.1. We have analyzed over 100 biological network instances within the computational performance comparison, and illustrated our method in a biological application to interpret the phosphoproteomic data derived from H358 cells, a model of lung cancer. A few dozen people have tested the package with respect to installation, debugging, parameter setting, and use with their own data. We provided the interaction network and the phosphoproteomic data from the lung cancer model within the package. Any bugs, suggestions, and requests related to the package can be reported through its GitHub repository (<ext-link ext-link-type="uri" xlink:href="https://github.com/IOR-Bioinformatics/PCSF" xlink:type="simple">https://github.com/IOR-Bioinformatics/PCSF</ext-link>).</p>
</sec>
</sec>
<sec id="sec006" sec-type="results">
<title>Results</title>
<sec id="sec007">
<title>Computational performance comparison</title>
<p>In this section, we compare the computational performance of our method with the message passing (MSGP) [<xref ref-type="bibr" rid="pcbi.1005694.ref003">3</xref>] algorithm. Belief propagation has been used in similar biological applications such as identification of unknown protein associations [<xref ref-type="bibr" rid="pcbi.1005694.ref003">3</xref>], prediction of hidden components in regulatory networks [<xref ref-type="bibr" rid="pcbi.1005694.ref007">7</xref>], and reconstruction of multiple dysregulated pathways [<xref ref-type="bibr" rid="pcbi.1005694.ref008">8</xref>]. As a template network, we used an integrated interactome of proteins [<xref ref-type="bibr" rid="pcbi.1005694.ref009">9</xref>] and metabolites [<xref ref-type="bibr" rid="pcbi.1005694.ref010">10</xref>], which is composed of 36892 nodes and 1016411 edges. We employed the phosphoproteomic data from the Breast Cancer patients in [<xref ref-type="bibr" rid="pcbi.1005694.ref011">11</xref>]. Network instances are generated by mapping each patient’s differential phosphoproteomic data as <italic>terminal</italic> nodes onto the template interactome. We tested the methods for <italic>ω</italic> = {1, 2}, and provided the average statistics of 10 runs to maintain a fair comparison baseline.</p>
<p>The comparison statistics of the methods are reported in <xref ref-type="table" rid="pcbi.1005694.t001">Table 1</xref>. The performance of the MSGP algorithm [<xref ref-type="bibr" rid="pcbi.1005694.ref003">3</xref>] and our method are provided under the MSGP and PCSF columns, respectively. The <italic>μ</italic> value was set to 0 for both methods to be comparable, which removes its impact on the objective function values. The solution qualities and running times of the approaches are displayed in the table. For these large network instances, the PCSF provides comparable quality solutions to the belief propagation algorithm for both values of <italic>ω</italic>. On the other hand, the PCSF significantly outperformed the belief propagation in terms of running times. There is an approximately tenfold speed-up on average, which can be useful for analyzing large biological networks in a reasonable time.</p>
<table-wrap id="pcbi.1005694.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1005694.t001</object-id>
<label>Table 1</label>
<caption>
<title>The results of the methods for the Breast Cancer network instances generated using the phosphoproteomic data in [<xref ref-type="bibr" rid="pcbi.1005694.ref011">11</xref>].</title>
<p>The performance of the message passing algorithm [<xref ref-type="bibr" rid="pcbi.1005694.ref003">3</xref>] and the proposed method are respectively displayed under MSGP [<xref ref-type="bibr" rid="pcbi.1005694.ref003">3</xref>] and PCSF for <italic>ω</italic> = {1, 2}. The OBJ column reports the quality of the solutions (objective function values) obtained by the methods, and the running times of the algorithms are displayed under t(s) in seconds. The average statistics of 10 runs provided by both algorithms are reported for each instance.</p>
</caption>
<alternatives>
<graphic id="pcbi.1005694.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1005694.t001" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center" colspan="2" rowspan="2"/>
<th align="center" colspan="4"><italic>ω</italic> = 1</th>
<th align="center" colspan="4"><italic>ω</italic> = 2</th>
</tr>
<tr>
<th align="center" colspan="2">MSGP [<xref ref-type="bibr" rid="pcbi.1005694.ref003">3</xref>]</th>
<th align="center" colspan="2">PCSF</th>
<th align="center" colspan="2">MSGP [<xref ref-type="bibr" rid="pcbi.1005694.ref003">3</xref>]</th>
<th align="center" colspan="2">PCSF</th>
</tr>
<tr>
<th align="center">Instance</th>
<th align="center">Terminals</th>
<th align="center">OBJ</th>
<th align="center">t(s)</th>
<th align="center">OBJ</th>
<th align="center">t(s)</th>
<th align="center">OBJ</th>
<th align="center">t(s)</th>
<th align="center">OBJ</th>
<th align="center">t(s)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="center">Basal-AN-A0AL</td>
<td align="center">92</td>
<td align="char" char=".">26.94</td>
<td align="center">1920</td>
<td align="char" char=".">27.18</td>
<td align="center">101</td>
<td align="char" char=".">27.94</td>
<td align="center">2025</td>
<td align="char" char=".">28.18</td>
<td align="center">100</td>
</tr>
<tr>
<td align="center">Basal-BH-A18Q</td>
<td align="center">283</td>
<td align="char" char=".">80.81</td>
<td align="center">2188</td>
<td align="char" char=".">81.31</td>
<td align="center">291</td>
<td align="char" char=".">82.89</td>
<td align="center">1532</td>
<td align="char" char=".">82.8</td>
<td align="center">297</td>
</tr>
<tr>
<td align="center">Her2-C8-A12Z</td>
<td align="center">63</td>
<td align="char" char=".">19.42</td>
<td align="center">1422</td>
<td align="char" char=".">19.51</td>
<td align="center">71</td>
<td align="char" char=".">20.42</td>
<td align="center">1151</td>
<td align="char" char=".">20.51</td>
<td align="center">71</td>
</tr>
<tr>
<td align="center">Her2-C8-A12L</td>
<td align="center">75</td>
<td align="char" char=".">25.07</td>
<td align="center">1002</td>
<td align="char" char=".">25.31</td>
<td align="center">83</td>
<td align="char" char=".">26.07</td>
<td align="center">1134</td>
<td align="char" char=".">26.31</td>
<td align="center">83</td>
</tr>
<tr>
<td align="center">Her2-A2-A0EQ</td>
<td align="center">139</td>
<td align="char" char=".">35.02</td>
<td align="center">1583</td>
<td align="char" char=".">35.33</td>
<td align="center">147</td>
<td align="char" char=".">36.02</td>
<td align="center">1545</td>
<td align="char" char=".">36.33</td>
<td align="center">148</td>
</tr>
<tr>
<td align="center">Her2-C8-A135</td>
<td align="center">193</td>
<td align="char" char=".">52.83</td>
<td align="center">1762</td>
<td align="char" char=".">53.19</td>
<td align="center">199</td>
<td align="char" char=".">53.85</td>
<td align="center">1680</td>
<td align="char" char=".">54.22</td>
<td align="center">200</td>
</tr>
<tr>
<td align="center">LumA-AO-A0JJ</td>
<td align="center">168</td>
<td align="char" char=".">50.2</td>
<td align="center">1970</td>
<td align="char" char=".">50.57</td>
<td align="center">176</td>
<td align="char" char=".">51.38</td>
<td align="center">1729</td>
<td align="char" char=".">51.83</td>
<td align="center">175</td>
</tr>
<tr>
<td align="center">LumA-A8-A08Z</td>
<td align="center">174</td>
<td align="char" char=".">48.55</td>
<td align="center">1749</td>
<td align="char" char=".">48.81</td>
<td align="center">179</td>
<td align="char" char=".">49.61</td>
<td align="center">1904</td>
<td align="char" char=".">49.87</td>
<td align="center">181</td>
</tr>
<tr>
<td align="center">LumA-BH-A0C1</td>
<td align="center">201</td>
<td align="char" char=".">52.42</td>
<td align="center">2092</td>
<td align="char" char=".">52.82</td>
<td align="center">210</td>
<td align="char" char=".">53.42</td>
<td align="center">1992</td>
<td align="char" char=".">53.82</td>
<td align="center">207</td>
</tr>
<tr>
<td align="center">LumB-AN-A0AJ</td>
<td align="center">149</td>
<td align="char" char=".">42.94</td>
<td align="center">2220</td>
<td align="char" char=".">43.32</td>
<td align="center">155</td>
<td align="char" char=".">43.96</td>
<td align="center">1732</td>
<td align="char" char=".">44.35</td>
<td align="center">156</td>
</tr>
<tr>
<td align="center">LumB-A7-A0CJ</td>
<td align="center">158</td>
<td align="char" char=".">45.36</td>
<td align="center">2506</td>
<td align="char" char=".">45.84</td>
<td align="center">167</td>
<td align="char" char=".">47.02</td>
<td align="center">1476</td>
<td align="char" char=".">47.52</td>
<td align="center">170</td>
</tr>
<tr>
<td align="center">LumB-AR-A1AV</td>
<td align="center">190</td>
<td align="char" char=".">56.47</td>
<td align="center">1656</td>
<td align="char" char=".">56.88</td>
<td align="center">199</td>
<td align="char" char=".">57.85</td>
<td align="center">1506</td>
<td align="char" char=".">58.26</td>
<td align="center">198</td>
</tr>
<tr>
<td align="center">LumB-AO-A03O</td>
<td align="center">193</td>
<td align="char" char=".">54.95</td>
<td align="center">1878</td>
<td align="char" char=".">55.22</td>
<td align="center">205</td>
<td align="char" char=".">55.87</td>
<td align="center">1239</td>
<td align="char" char=".">56.22</td>
<td align="center">197</td>
</tr>
<tr>
<td align="center">LumB-BH-A0DD</td>
<td align="center">230</td>
<td align="char" char=".">60.31</td>
<td align="center">2297</td>
<td align="char" char=".">60.65</td>
<td align="center">235</td>
<td align="char" char=".">61.37</td>
<td align="center">2358</td>
<td align="char" char=".">61.71</td>
<td align="center">238</td>
</tr>
<tr>
<td align="center">LumB-A2-A0T3</td>
<td align="center">248</td>
<td align="char" char=".">65.83</td>
<td align="center">1793</td>
<td align="char" char=".">66.05</td>
<td align="center">261</td>
<td align="char" char=".">66.91</td>
<td align="center">2053</td>
<td align="char" char=".">67.13</td>
<td align="center">256</td>
</tr>
<tr>
<td align="center" rowspan="2"/>
<td align="center"><italic>mean</italic></td>
<td align="char" char=".">47.81</td>
<td align="center">1869</td>
<td align="char" char=".">48.13</td>
<td align="center">179</td>
<td align="char" char=".">48.97</td>
<td align="center">1670</td>
<td align="char" char=".">49.27</td>
<td align="center">178</td>
</tr>
<tr>
<td align="center"><italic>std</italic></td>
<td align="char" char=".">16.26</td>
<td align="center">377</td>
<td align="char" char=".">16.32</td>
<td align="center">62</td>
<td align="char" char=".">16.43</td>
<td align="center">354</td>
<td align="char" char=".">16.42</td>
<td align="center">62</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
<p>For more information about the PCSF algorithm and rigorous performance comparisons, interested readers are referred to [<xref ref-type="bibr" rid="pcbi.1005694.ref006">6</xref>].</p>
</sec>
<sec id="sec008">
<title>Biological application</title>
<p>In this section, we demonstrate the usage of the PCSF package on biological data and discuss the package's functionality and its output within the R environment. We analyze differential phosphoproteomic data derived from H358 cells, a model of lung cancer, that were stimulated with TGF-<italic>β</italic>. These data were previously published in [<xref ref-type="bibr" rid="pcbi.1005694.ref012">12</xref>], and were also used to demonstrate Omics Integrator [<xref ref-type="bibr" rid="pcbi.1005694.ref004">4</xref>]. We construct a template PPI network from the STRING database (version 13) [<xref ref-type="bibr" rid="pcbi.1005694.ref009">9</xref>] and apply some filtering steps [<xref ref-type="bibr" rid="pcbi.1005694.ref006">6</xref>]. A named vector containing the proteomic data and a data frame containing the filtered PPI are available within the package. The template network and data are loaded into the R environment as follows:</p>
<list list-type="simple">
<list-item>
<p>
<monospace>&gt; data("STRING")</monospace>
</p>
</list-item>
<list-item>
<p>
<monospace>&gt; ppi &lt;- construct_interactome(STRING)</monospace>
</p>
</list-item>
<list-item>
<p>
<monospace>&gt; data("Tgfb_phospho")</monospace>
</p>
</list-item>
<list-item>
<p>
<monospace>&gt; terminals &lt;- Tgfb_phospho</monospace>
</p>
</list-item>
</list>
<p>The resulting PPI network consists of 17581 edges and 15405 nodes, of which 58 are terminal nodes corresponding to differentially phosphorylated proteins. After loading the PPI network and assigning the terminal prizes, we use <monospace>PCSF()</monospace> to find high-confidence subnetworks by providing the parameters <italic>β</italic>, <italic>ω</italic> and <italic>μ</italic>, as discussed earlier in the paper. The dynamic and interactive output subnetwork can be plotted with the <monospace>plot()</monospace> function.</p>
<list list-type="simple">
<list-item>
<p>
<monospace>&gt; subnet &lt;- PCSF(ppi, terminals, w = 2, b = 1, mu = 0.0005)</monospace>
</p>
</list-item>
<list-item>
<p>
<monospace>&gt; plot(subnet)</monospace>
</p>
</list-item>
</list>
<p>Given that the edge weights and input data are often derived from high-throughput data and are necessarily noisy, it is recommended to test the robustness of the solution. One way to do this is to solve the PCSF several times while adding noise to the edge costs, and to combine all results in the final subnetwork. Edges and nodes are then given scores indicating how many times they appeared in the solutions with varying edge costs.</p>
<list list-type="simple">
<list-item>
<p>
<monospace>&gt; subnet &lt;- PCSF_rand(ppi, terminals, n = 10, r = 0.1, w = 2, b = 1, mu = 0.0005)</monospace>
</p>
</list-item>
</list>
<p>Next, an enrichment analysis of the final subnetwork is performed for functional interpretation. The subnetwork is clustered using the edge betweenness clustering algorithm from the igraph R-package, and for each cluster, functional enrichment is done by employing either the EnrichR [<xref ref-type="bibr" rid="pcbi.1005694.ref013">13</xref>] API or the topGO [<xref ref-type="bibr" rid="pcbi.1005694.ref014">14</xref>] R-package, as specified by the user. Note that the EnrichR API requires a working internet connection to perform the enrichment. If not specified, the package defaults to EnrichR; it uses topGO if there is no internet connection.</p>
<p>An interactive version of the annotated subnetwork can be visualized as in <xref ref-type="fig" rid="pcbi.1005694.g001">Fig 1</xref>. In the case of the TGF-<italic>β</italic> stimulation data, the subnetwork provided by PCSF was enriched for relevant Gene Ontology terms like “mesenchymal-epithelial cell signaling” and “EGFR downregulation”. We also see Steiner nodes such as CBL and ITGB5, which have been shown to be involved in several models of non-small cell lung cancers [<xref ref-type="bibr" rid="pcbi.1005694.ref015">15</xref>], like the H358 cells. Therefore, we see that the PCSF algorithm points out proteins and pathways that are highly relevant to the system under study.</p>
<list list-type="simple">
<list-item>
<p>
<monospace>&gt; res &lt;- enrichment_analysis(subnet)</monospace>
</p>
</list-item>
<list-item>
<p>
<monospace>&gt; plot(res$subnet)</monospace>
</p>
</list-item>
</list>
<fig id="pcbi.1005694.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pcbi.1005694.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Functional enrichment analysis of the final subnetwork using the EnrichR API.</title>
<p>The node sizes and edge widths are proportional to the number of times that node or edge appeared in the noisy runs. Nodes are colored according to cluster membership. As in the EnrichR API, the p-value is calculated using the Fisher test and adjusted for multiple hypotheses. The top 15 functional enrichment terms for each cluster are ranked according to the adjusted p-value and displayed in a tabular format when the mouse hovers over a node in that cluster. Each cluster can be visualized separately using the “Select by group” icon located at the top of the figure.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1005694.g001" xlink:type="simple"/>
</fig>
</sec>
</sec>
<sec id="sec009">
<title>Availability and future directions</title>
<p>The source code of the package and the tutorials are available on GitHub at <ext-link ext-link-type="uri" xlink:href="https://github.com/IOR-Bioinformatics/PCSF" xlink:type="simple">https://github.com/IOR-Bioinformatics/PCSF</ext-link>. The package is accompanied by build and installation documentation, a detailed vignette and a reference manual that demonstrate the usage of its functions. We used the MIT open source software license for the package.</p>
<p>The PCSF is a general method and it can also be applied to interpret multi-omics data for functional analysis. We plan to integrate genomic, transcriptomic, proteomic and metabolomic high-throughput data by mapping them onto biological networks and solving the PCSF. Heterogeneous omics data integration is an extremely challenging task. At the same time, it is crucial for obtaining an overall picture and in-depth understanding of cellular mechanisms, and for developing effective therapeutic strategies for complex diseases. Currently, the bioinformatics community is still missing effective data integration techniques, and we believe our method will be a step towards improving the methods available in the literature.</p>
<p>Last but not least, the proposed package is significantly faster than the previous network-based PCSF methods, and can analyze large biological networks in a reasonable time.</p>
</sec>
<sec id="sec010">
<title>Supporting information</title>
<supplementary-material id="pcbi.1005694.s001" mimetype="text/html" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1005694.s001" xlink:type="simple">
<label>S1 File</label>
<caption>
<title>A vignette for the package.</title>
<p>(HTML)</p>
</caption>
</supplementary-material>
<supplementary-material id="pcbi.1005694.s002" mimetype="application/pdf" position="float" xlink:href="info:doi/10.1371/journal.pcbi.1005694.s002" xlink:type="simple">
<label>S2 File</label>
<caption>
<title>A reference manual of the package.</title>
<p>(PDF)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ref-list>
<title>References</title>
<ref id="pcbi.1005694.ref001">
<label>1</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Dittrich</surname> <given-names>M.T.</given-names></name>, <name name-style="western"><surname>Klau</surname> <given-names>G.W.</given-names></name>, <name name-style="western"><surname>Rosenwald</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>Dandekar</surname> <given-names>T.</given-names></name> and <name name-style="western"><surname>Mueller</surname> <given-names>T</given-names></name>. (<year>2008</year>) <article-title>Identifying functional modules in protein-protein interaction networks: an integrated exact approach</article-title>, <source><italic>Bioinformatics</italic></source>, <volume>24</volume>(<issue>13</issue>), <fpage>i223</fpage>–<lpage>i231</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1093/bioinformatics/btn161" xlink:type="simple">10.1093/bioinformatics/btn161</ext-link></comment> <object-id pub-id-type="pmid">18586718</object-id></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref002">
<label>2</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Beisser</surname> <given-names>D.</given-names></name>, <name name-style="western"><surname>Klau</surname> <given-names>G.W.</given-names></name>, <name name-style="western"><surname>Dandekar</surname> <given-names>T.</given-names></name>, <name name-style="western"><surname>Mueller</surname> <given-names>T.</given-names></name> and <name name-style="western"><surname>Dittrich</surname> <given-names>M</given-names></name>. (<year>2010</year>) <article-title>BioNet: an R-package for the Functional Analysis of Biological Networks</article-title>, <source><italic>Bioinformatics</italic></source>, <volume>26</volume>(<issue>8</issue>), <fpage>1129</fpage>–<lpage>1130</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1093/bioinformatics/btq089" xlink:type="simple">10.1093/bioinformatics/btq089</ext-link></comment> <object-id pub-id-type="pmid">20189939</object-id></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref003">
<label>3</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bailly-Bechet</surname> <given-names>M.</given-names></name>, <name name-style="western"><surname>Borgs</surname> <given-names>C.</given-names></name>, <name name-style="western"><surname>Braunstein</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>Chayes</surname> <given-names>J.</given-names></name>, <name name-style="western"><surname>Dagkessamanskaia</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>François</surname> <given-names>J.M.</given-names></name> and <name name-style="western"><surname>Zecchina</surname> <given-names>R</given-names></name>. (<year>2010</year>) <article-title>Finding undetected protein associations in cell signaling by belief propagation</article-title>, <source><italic>PNAS</italic></source>, <volume>108</volume>, <fpage>882</fpage>–<lpage>887</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1073/pnas.1004751108" xlink:type="simple">10.1073/pnas.1004751108</ext-link></comment> <object-id pub-id-type="pmid">21187432</object-id></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref004">
<label>4</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Tuncbag</surname> <given-names>N.</given-names></name>, <name name-style="western"><surname>Gosline</surname> <given-names>S.J.C.</given-names></name>, <name name-style="western"><surname>Kedaigle</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>Soltis</surname> <given-names>A.R.</given-names></name>, <name name-style="western"><surname>Gitter</surname> <given-names>A.</given-names></name> and <name name-style="western"><surname>Fraenkel</surname> <given-names>E</given-names></name>. (<year>2016</year>) <article-title>Network-Based Interpretation of Diverse High-Throughput Datasets through the Omics Integrator Software Package</article-title>, <source><italic>PLoS Comput Biol</italic></source>, <volume>12</volume>(<issue>4</issue>), <fpage>e1004879</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1371/journal.pcbi.1004879" xlink:type="simple">10.1371/journal.pcbi.1004879</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref005">
<label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Akhmedov</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Kwee</surname> <given-names>I</given-names></name>, and <name name-style="western"><surname>Montemanni</surname> <given-names>R</given-names></name>. (<year>2016</year>) <article-title>A divide and conquer matheuristic algorithm for the Prize-collecting Steiner Tree Problem</article-title>, <source><italic>Computers and Operations Research</italic></source>, <volume>70</volume>, <fpage>18</fpage>–<lpage>25</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1016/j.cor.2015.12.015" xlink:type="simple">10.1016/j.cor.2015.12.015</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref006">
<label>6</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Akhmedov</surname> <given-names>M.</given-names></name>, <name name-style="western"><surname>LeNail</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>Bertoni</surname> <given-names>F.</given-names></name>, <name name-style="western"><surname>Kwee</surname> <given-names>I.</given-names></name>, <name name-style="western"><surname>Fraenkel</surname> <given-names>E.</given-names></name> and <name name-style="western"><surname>Montemanni</surname> <given-names>R</given-names></name>. (<year>2017</year>) <article-title>A fast Prize-collecting Steiner Forest algorithm for Functional Analyses in Biological Networks</article-title>, <source><italic>Lecture Notes in Computer Science</italic></source>, <fpage>263</fpage>–<lpage>276</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1007/978-3-319-59776-8_22" xlink:type="simple">10.1007/978-3-319-59776-8_22</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref007">
<label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Tuncbag</surname> <given-names>N.</given-names></name>, <name name-style="western"><surname>Braunstein</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>Pagnani</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>Huang</surname> <given-names>S.C.</given-names></name>, <name name-style="western"><surname>Chayes</surname> <given-names>J.</given-names></name>, <name name-style="western"><surname>Borgs</surname> <given-names>C.</given-names></name>, <name name-style="western"><surname>Zecchina</surname> <given-names>R</given-names></name>. and <name name-style="western"><surname>Fraenkel</surname> <given-names>E</given-names></name>. <article-title>Simultaneous Reconstruction of Multiple Signaling Pathways via the Prize-Collecting Steiner Forest Problem</article-title>. <source><italic>Journal of Computational Biology</italic></source>, <volume>20</volume>(<issue>2</issue>):<fpage>124</fpage>–<lpage>136</lpage>, <year>2013</year>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1089/cmb.2012.0092" xlink:type="simple">10.1089/cmb.2012.0092</ext-link></comment> <object-id pub-id-type="pmid">23383998</object-id></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref008">
<label>8</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Tuncbag</surname> <given-names>N.</given-names></name>, <name name-style="western"><surname>McCallum</surname> <given-names>S</given-names></name>. <name name-style="western"><surname>Huang</surname> <given-names>S.C.</given-names></name>, and <name name-style="western"><surname>Fraenkel</surname> <given-names>E</given-names></name>. <article-title>SteinerNet: a web server for integrating ‘omic’ data to discover hidden components of response pathways</article-title>. <source><italic>Nucleic Acids Research</italic></source>, <fpage>1</fpage>–<lpage>5</lpage>, <year>2012</year>.</mixed-citation>
</ref>
<ref id="pcbi.1005694.ref009">
<label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Szklarczyk</surname> <given-names>D.</given-names></name>, <name name-style="western"><surname>Franceschini</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>Kuhn</surname> <given-names>M.</given-names></name>, <name name-style="western"><surname>Simonovic</surname> <given-names>M.</given-names></name>, <name name-style="western"><surname>Roth</surname> <given-names>A.</given-names></name>, <name name-style="western"><surname>Minguez</surname> <given-names>P.</given-names></name>, <name name-style="western"><surname>Doerks</surname> <given-names>T.</given-names></name>, <name name-style="western"><surname>Stark</surname> <given-names>M.</given-names></name>, <name name-style="western"><surname>Muller</surname> <given-names>J.</given-names></name>, <name name-style="western"><surname>Bork</surname> <given-names>P.</given-names></name>, <name name-style="western"><surname>Jensen</surname> <given-names>L.J.</given-names></name> and <name name-style="western"><surname>Mering</surname> <given-names>C.v.</given-names></name> (<year>2011</year>) <article-title>The STRING database in 2011: functional interaction networks of proteins, globally integrated and scored</article-title>, <source><italic>Nucleic Acids Res</italic></source>, <volume>39</volume>, <fpage>D561</fpage>–<lpage>D568</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1093/nar/gkq973" xlink:type="simple">10.1093/nar/gkq973</ext-link></comment> <object-id pub-id-type="pmid">21045058</object-id></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref010">
<label>10</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Wishart</surname> <given-names>D.S.</given-names></name>, <name name-style="western"><surname>Tzur</surname> <given-names>D.</given-names></name>, <name name-style="western"><surname>Knox</surname> <given-names>C.</given-names></name>, <name name-style="western"><surname>Eisner</surname> <given-names>R.</given-names></name>, <name name-style="western"><surname>Guo</surname> <given-names>A.C.</given-names></name>, <name name-style="western"><surname>Young</surname> <given-names>N.</given-names></name>, … and <name name-style="western"><surname>Fung</surname> <given-names>C</given-names></name>. (<year>2007</year>). <article-title>HMDB: the Human Metabolome Database</article-title>. <source>Nucleic Acids Res</source>. 2007 <month>Jan</month>;<volume>35</volume>(<issue>Database issue</issue>):<fpage>D521</fpage>–<lpage>6</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1093/nar/gkl923" xlink:type="simple">10.1093/nar/gkl923</ext-link></comment></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref011">
<label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Mertins</surname> <given-names>P.</given-names></name>, <name name-style="western"><surname>Mani</surname> <given-names>D.R.</given-names></name>, <name name-style="western"><surname>Ruggles</surname> <given-names>K.V.</given-names></name>, <name name-style="western"><surname>Gillette</surname> <given-names>M.A.</given-names></name>, <name name-style="western"><surname>Clauser</surname> <given-names>K.R.</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>P.</given-names></name>, … and <name name-style="western"><surname>Kawaler</surname> <given-names>E</given-names></name>. (<year>2016</year>). <article-title>Proteogenomics connects somatic mutations to signalling in breast cancer</article-title>. <source><italic>Nature</italic></source>, <volume>534</volume>:<fpage>55</fpage>–<lpage>62</lpage>, <month>June</month> 2016. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1038/nature18003" xlink:type="simple">10.1038/nature18003</ext-link></comment> <object-id pub-id-type="pmid">27251275</object-id></mixed-citation>
</ref>
<ref id="pcbi.1005694.ref012">
<label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Thomson</surname> <given-names>S.</given-names></name>, <name name-style="western"><surname>Petti</surname> <given-names>F.</given-names></name>, <name name-style="western"><surname>Sujka-Kwok</surname> <given-names>I.</given-names></name>, <name name-style="western"><surname>Mercado</surname> <given-names>P.</given-names></name>, <name name-style="western"><surname>Bean</surname> <given-names>J.</given-names></name>, <name name-style="western"><surname>Monaghan</surname> <given-names>M.</given-names></name>, <name name-style="western"><surname>Seymour</surname> <given-names>S.L.</given-names></name>, <name name-style="western"><surname>Argast</surname> <given-names>G.M.</given-names></name>, <name name-style="western"><surname>Epstein</surname> <given-names>D.M.</given-names></name> and <name name-style="western"><surname>Haley</surname> <given-names>J.D</given-names></name>. (<year>2011</year>) <article-title>A systems view of epithelial-mesenchymal transition signaling states</article-title>, <source><italic>Clinical &amp; experimental metastasis</italic></source>, <volume>28</volume>(<issue>2</issue>), <fpage>137</fpage>–<lpage>155</lpage>.</mixed-citation>
</ref>
<ref id="pcbi.1005694.ref013">
<label>13</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Chen</surname> <given-names>E.Y.</given-names></name>, <name name-style="western"><surname>Tan</surname> <given-names>C.M.</given-names></name>, <name name-style="western"><surname>Kou</surname> <given-names>Y.</given-names></name>, <name name-style="western"><surname>Duan</surname> <given-names>Q.</given-names></name>, <name name-style="western"><surname>Wang</surname> <given-names>Z.</given-names></name>, <name name-style="western"><surname>Meirelles</surname> <given-names>G.V.</given-names></name>, <name name-style="western"><surname>Clark</surname> <given-names>N.R.</given-names></name> and <name name-style="western"><surname>Ma’ayan</surname> <given-names>A</given-names></name>. (<year>2013</year>) <article-title>Enrichr: interactive and collaborative HTML5 gene list enrichment analysis tool</article-title>, <source><italic>BMC Bioinformatics</italic></source>, <volume>14</volume>, <fpage>128</fpage>.</mixed-citation>
</ref>
<ref id="pcbi.1005694.ref014">
<label>14</label>
<mixed-citation publication-type="other" xlink:type="simple">Alexa A. and Rahnenführer J. (2009). topGO: Enrichment Analysis for Gene Ontology. R package version 2.28.0.</mixed-citation>
</ref>
<ref id="pcbi.1005694.ref015">
<label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Tan</surname> <given-names>Y.H.C.</given-names></name>, <name name-style="western"><surname>Krishnaswamy</surname> <given-names>S.</given-names></name>, <name name-style="western"><surname>Nandi</surname> <given-names>S.</given-names></name>, <name name-style="western"><surname>Kanteti</surname> <given-names>R.</given-names></name>, <name name-style="western"><surname>Vora</surname> <given-names>S.</given-names></name>, <name name-style="western"><surname>Onel</surname> <given-names>K.</given-names></name>, … and <name name-style="western"><surname>Robinson</surname> <given-names>M</given-names></name>. (<year>2010</year>). <article-title>CBL Is Frequently Altered in Lung Cancers: Its Relationship to Mutations in Met and Egfr Tyrosine Kinases</article-title>, <source><italic>PloS One</italic></source>, <volume>5</volume> (<issue>1</issue>), Public Library of Science: <fpage>e8972</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1371/journal.pone.0008972" xlink:type="simple">10.1371/journal.pone.0008972</ext-link></comment> <object-id pub-id-type="pmid">20126411</object-id></mixed-citation>
</ref>
</ref-list>
</back>
</article>