<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosone</journal-id>
<journal-title-group>
<journal-title>PLOS ONE</journal-title>
</journal-title-group>
<issn pub-type="epub">1932-6203</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.1371/journal.pone.0232644</article-id>
<article-id pub-id-type="publisher-id">PONE-D-20-11085</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3">
<subject>Physical sciences</subject><subj-group><subject>Materials science</subject><subj-group><subject>Material properties</subject><subj-group><subject>Tractability</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Computer and information sciences</subject><subj-group><subject>Information technology</subject><subj-group><subject>Databases</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Physical sciences</subject><subj-group><subject>Mathematics</subject><subj-group><subject>Applied mathematics</subject><subj-group><subject>Algorithms</subject><subj-group><subject>Machine learning algorithms</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Simulation and modeling</subject><subj-group><subject>Algorithms</subject><subj-group><subject>Machine learning algorithms</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Computer and information sciences</subject><subj-group><subject>Artificial intelligence</subject><subj-group><subject>Machine learning</subject><subj-group><subject>Machine learning algorithms</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Computer and information sciences</subject><subj-group><subject>Artificial intelligence</subject><subj-group><subject>Machine learning</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Computational biology</subject><subj-group><subject>Genome analysis</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Genomics</subject><subj-group><subject>Genome analysis</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Human genetics</subject><subj-group><subject>Genome-wide association studies</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Molecular biology</subject><subj-group><subject>Molecular biology techniques</subject><subj-group><subject>Molecular biology assays and analysis techniques</subject><subj-group><subject>Gene expression and vector techniques</subject><subj-group><subject>Protein expression</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Molecular biology techniques</subject><subj-group><subject>Molecular biology assays and analysis techniques</subject><subj-group><subject>Gene expression and vector techniques</subject><subj-group><subject>Protein expression</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Genetics</subject><subj-group><subject>Genetics of disease</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Mental health and psychiatry</subject><subj-group><subject>Dementia</subject><subj-group><subject>Alzheimer's disease</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Neurology</subject><subj-group><subject>Dementia</subject><subj-group><subject>Alzheimer's disease</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Medical conditions</subject><subj-group><subject>Neurodegenerative diseases</subject><subj-group><subject>Alzheimer's disease</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Neurology</subject><subj-group><subject>Neurodegenerative diseases</subject><subj-group><subject>Alzheimer's disease</subject></subj-group></subj-group></subj-group></subj-group></article-categories>
<title-group>
<article-title>TargetDB: A target information aggregation tool and tractability predictor</article-title>
<alt-title alt-title-type="running-head">TargetDB</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0003-4443-4217</contrib-id>
<name name-style="western">
<surname>De Cesco</surname>
<given-names>Stephane</given-names>
</name>
<role content-type="https://casrai.org/credit/">Conceptualization</role>
<role content-type="https://casrai.org/credit/">Formal analysis</role>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Software</role>
<role content-type="https://casrai.org/credit/">Writing – original draft</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"/>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Davis</surname>
<given-names>John B.</given-names>
</name>
<role content-type="https://casrai.org/credit/">Conceptualization</role>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Supervision</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"/>
</contrib>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-8950-7646</contrib-id>
<name name-style="western">
<surname>Brennan</surname>
<given-names>Paul E.</given-names>
</name>
<role content-type="https://casrai.org/credit/">Conceptualization</role>
<role content-type="https://casrai.org/credit/">Methodology</role>
<role content-type="https://casrai.org/credit/">Project administration</role>
<role content-type="https://casrai.org/credit/">Resources</role>
<role content-type="https://casrai.org/credit/">Supervision</role>
<role content-type="https://casrai.org/credit/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"/>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
</contrib-group>
<aff id="aff001"><addr-line>Nuffield Department of Medicine, ARUK Oxford Drug Discovery Institute, Target Discovery Institute, University of Oxford, Oxford, United-Kingdom</addr-line></aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Barchi</surname>
<given-names>Joseph J</given-names>
</name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1"><addr-line>National Cancer Institute at Frederick, UNITED STATES</addr-line></aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>No competing interest to declare.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">paul.brennan@ndm.ox.ac.uk</email> (PEB); <email xlink:type="simple">sdecesco@gmail.com</email> (SDC)</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>2</day>
<month>9</month>
<year>2020</year>
</pub-date>
<pub-date pub-type="collection">
<year>2020</year>
</pub-date>
<volume>15</volume>
<issue>9</issue>
<elocation-id>e0232644</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>4</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>28</day>
<month>7</month>
<year>2020</year>
</date>
</history>
<permissions>
<copyright-year>2020</copyright-year>
<copyright-holder>De Cesco et al</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pone.0232644"/>
<abstract>
<p>When trying to identify new potential therapeutic protein targets, access to data and knowledge is increasingly important. In a field where new resources and data sources become available every day, it is crucial to be able to take a step back and look at the wider picture in order to identify potential drug targets. While this task is routinely performed by bespoke literature searches, it is often time-consuming and lacks uniformity when comparing multiple targets at one time. To address this challenge, we developed TargetDB, a tool that aggregates public information available on given target(s) (links to disease, safety, 3D structures, ligandability, novelty, etc.) and assembles it in an easy to read output ready for the researcher to analyze. In addition, we developed a target scoring system based on the desirable attributes of good therapeutic targets and machine learning classification system to categorize novel targets as having promising or challenging tractrability. In this manuscript, we present the methodology used to develop TargetDB as well as test cases.</p>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/501100002283</institution-id>
<institution>Alzheimer’s Research UK</institution>
</institution-wrap>
</funding-source>
<award-id>2018DDI-OX</award-id>
</award-group>
<funding-statement>This work was supported by Alzheimer’s Research UK [registered charity 1077089 and SC042474].</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="1"/>
<page-count count="12"/>
</counts>
<custom-meta-group>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>All of the data used and code developped for this project is deposited in a GitHub repository (<ext-link ext-link-type="uri" xlink:href="https://github.com/sdecesco/targetDB" xlink:type="simple">https://github.com/sdecesco/targetDB</ext-link>)</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>With the rising availability of genome-wide association data (GWAS) [<xref ref-type="bibr" rid="pone.0232644.ref001">1</xref>], proteomics [<xref ref-type="bibr" rid="pone.0232644.ref002">2</xref>,<xref ref-type="bibr" rid="pone.0232644.ref003">3</xref>], CRISPR [<xref ref-type="bibr" rid="pone.0232644.ref004">4</xref>–<xref ref-type="bibr" rid="pone.0232644.ref006">6</xref>] and RNAi [<xref ref-type="bibr" rid="pone.0232644.ref007">7</xref>], the list of potential protein targets for a given disease is growing rapidly. In this context, researchers are spoilt for choice when it comes to picking a target for further investigation, and yet the failure rate in clinical trials suggests that researchers are routinely failing to select the best targets against which to pitch their drug discovery efforts. To help them in this task, a plethora of excellent publicly available resources exist, such as UniProt [<xref ref-type="bibr" rid="pone.0232644.ref008">8</xref>], DrugBank [<xref ref-type="bibr" rid="pone.0232644.ref009">9</xref>], ChEMBL [<xref ref-type="bibr" rid="pone.0232644.ref010">10</xref>], Open Targets [<xref ref-type="bibr" rid="pone.0232644.ref011">11</xref>], Therapeutic Target Database (TTD) [<xref ref-type="bibr" rid="pone.0232644.ref012">12</xref>], The Drug Gene Interaction database (DGIdb) [<xref ref-type="bibr" rid="pone.0232644.ref013">13</xref>], Target Central Resource Database (TCRD) [<xref ref-type="bibr" rid="pone.0232644.ref014">14</xref>] and many others [<xref ref-type="bibr" rid="pone.0232644.ref015">15</xref>]. While they all provide valuable information, combining all this information in a single place for further analysis or prioritization of a list of targets can become a daunting task. With each data source specializing in different areas such as protein expression, disease association or pharmacology, researchers are required to collate and navigate through a miriad of cross-references in order to paint an accurate portrait of a potential target. Although resources such as UniProt, Pharos/TCRD and Open Targets already propose some aggregation of data, we propose with TargetDB to complement them with additional information such as structurally enabled druggability assessment, area-specific scoring for agile prioritization and a tractability prediction model. More recently, a tool with similar features, TractaViewer, has been described in the literature [<xref ref-type="bibr" rid="pone.0232644.ref016">16</xref>]. While this tool allows the user to classify targets into different bins, it does not provide an area specific score or a general scoring system that can be used for target prioritization. The bin assignment combined with the scoring system of TargetDB, however, could provide valuable information to researchers seeking to assess target tractability.</p>
</sec>
<sec id="sec002" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="sec003">
<title>TargetDB</title>
<p>TargetDB is distributed as a python package and a pre-built SQLite database. The user can also build the database from scratch using a command-line interface in Linux based systems. Details on the database and on how to install the package are available in the Supplementary Information (<xref ref-type="supplementary-material" rid="pone.0232644.s001">S1 File</xref>) and on the GitHub page (<ext-link ext-link-type="uri" xlink:href="https://github.com/sdecesco/targetDB" xlink:type="simple">https://github.com/sdecesco/targetDB</ext-link>).</p>
</sec>
<sec id="sec004">
<title>Data sources</title>
<p>Data used in TargetDB comes from a variety of sources. Some data comes from pre-aggregated/processed data from other databases such as UniProt or TCRD. While others come directly from the source API’s such as Human Protein Atlas for protein expression levels and Open Targets for disease association. The full list of data sources is available in the Supplementary Information (<xref ref-type="supplementary-material" rid="pone.0232644.s001">S1 File</xref>).</p>
</sec>
<sec id="sec005">
<title>Structural assessment of druggability</title>
<p>Fpocket [<xref ref-type="bibr" rid="pone.0232644.ref017">17</xref>] (version 3) was used in order to probe the potential ligandability of queried targets by assessing the presence of protein pockets amenable for small molecule binding (<ext-link ext-link-type="uri" xlink:href="https://github.com/Discngine/fpocket" xlink:type="simple">https://github.com/Discngine/fpocket</ext-link>). For each target in the database, PDB files were downloaded locally and only the smallest biological assembly with a chain representing the target of interest was kept for further analysis. Fpocket was then used with the default parameters and output files read and incorporated into the TargetDB database.</p>
</sec>
<sec id="sec006">
<title>Tractability model</title>
<p>Data collated in TargetDB is then retrieved and used to generate a series of descriptors that are used for: 1) calculate the area-specific overall score, 2) as input for machine learning algorithm in order to predict the target tractability. The final model uses the random forest algorithm from the python package sci-kit-learn [<xref ref-type="bibr" rid="pone.0232644.ref018">18</xref>]. The building of the model is discussed in the results and detailed procedures and code, in the form of a jupyter notebook, and training/testing data are available in the GitHub repository.</p>
</sec>
</sec>
<sec id="sec007" sec-type="results">
<title>Results</title>
<p>Once the program and database are downloaded, TargetDB can be run as a Tkinter graphical interface where different modes can be selected (<xref ref-type="fig" rid="pone.0232644.g001">Fig 1</xref>): Single Mode, List Mode and Spider Plot mode. For each mode, the target(s) of interest need to be specified. In Single Mode, one file is generated per gene entered and, while nothing prevents the user from using this mode for a large number of targets, it is best suited for a handful of genes. For a large number of targets the List Mode is more appropriate, as it produces a single file with several columns that allow the user to prioritize targets according to many attributes. In Spider Plot mode, a graphical spider plot representation of a single target landscape is depicted, representing the amount of knowledge on a target in different areas. This plot is also included in the Single Mode output. An example of each output is available in the supporting information.</p>
<fig id="pone.0232644.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0232644.g001</object-id>
<label>Fig 1</label>
<caption>
<title>TargetDB modes.</title>
<p>These are the available worklflows and recommended usage for the TargetDB output formats.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.g001" xlink:type="simple"/>
</fig>
<sec id="sec008">
<title>Aggregated information about a specific target</title>
<p>The excel document (<xref ref-type="supplementary-material" rid="pone.0232644.s002">S2 File</xref>) generated from the database contains several worksheets with different information regarding the target. The main page contains general information as well as the spider plot. Detailed sheets provided are listed below with a short description.</p>
<sec id="sec009">
<title>Pubmed search</title>
<p>A pubmed search using the gene name as search term is conducted and the 500 most recent publications are listed in the worksheet.</p>
</sec>
<sec id="sec010">
<title>Diseases</title>
<p>This worksheet contains the protein expression (upregulated or downregulated) and GWAS associations for the target in the context of different diseases. This data comes from the Humanmine datasource [<xref ref-type="bibr" rid="pone.0232644.ref019">19</xref>].</p>
</sec>
<sec id="sec011">
<title>Open target association</title>
<p>Disease associations come from the Open Targets platform. The individual disease, disease areas and association type scores are displayed.</p>
</sec>
<sec id="sec012">
<title>Expression</title>
<p>Protein expression levels come from the Human Protein Atlas portal. Numerical values can be interpreted as the following: 3 = High level of expression; 2 = Medium level of expression; 1 = Low level of expression; 0 = Not observed.</p>
</sec>
<sec id="sec013">
<title>Genotypes</title>
<p>List of different mouse genotypes (Knockout, knockdown, etc.) for the target of interest with their associated observed phenotypes. Green color identifies genotypes with no abnormal phenotypes observed, while red indicates a genotype with a lethal phenotype observed.</p>
</sec>
<sec id="sec014">
<title>Isoforms</title>
<p>List of different isoforms with their associated sequence differences.</p>
</sec>
<sec id="sec015">
<title>Variants/Mutants</title>
<p>List of observed variants and mutants along with their sequences and the effect observed if available.</p>
</sec>
<sec id="sec016">
<title>Structure</title>
<p>This worksheet contains a list of all available structures available in the PDB. The code, along with the technique, resolution, chain and sequence coverage, is listed together with information from PDBBind. On top of that, details on domains and their tractability/druggability coming from DrugEbillity is also displayed.</p>
</sec>
<sec id="sec017">
<title>Pockets</title>
<p>After analysis of potential small molecule binding pockets with fpocket3, the results are imported into TargetDB and are displayed in this sheet. The ligandability score is generated directly by the fpocket3 algorithm and we refer the reader to the original paper for more details about the method used to generate this score [<xref ref-type="bibr" rid="pone.0232644.ref020">20</xref>]. As a general guideline, a ligandability binding pocket will have a score of over 0.5, up to a maximum of 1. If multiple pockets are found for a single structure, a complete list of them will be output. If no druggable pocket is found in the target PDB or no PDB is available for the target, a BLAST search is performed on sequences that have a crystal structure deposited in the PDB. A similar pocket analysis is then performed, and the result displayed in the output document with the identified target as well as the sequence similarity between them.</p>
</sec>
<sec id="sec018">
<title>Binding</title>
<p>Bioactivities extracted from ChEMBL contain many different types of data and, while they all provide valuable information, it was decided to segregate the data into different sheets: Binding, Dose-response, Percent Inhibition, ADME and Other bioactivities. The Binding sheet only contains Ki/Kd datapoints. Bioactivities of a given ligand against other targets were collected and used to calculate a selectivity score (Selectivity Entropy—Shannon Entropy [<xref ref-type="bibr" rid="pone.0232644.ref021">21</xref>]), the name of the target for which the ligand has the best bioactivity is also displayed. To provide more information about the ligands, physicochemical properties, as well as the CNS MPO [<xref ref-type="bibr" rid="pone.0232644.ref022">22</xref>] score, are also provided.</p>
</sec>
<sec id="sec019">
<title>Dose-response/Percent-Inhibition/ADME/Other bioactivities</title>
<p>Similar to the above mentioned but with different data types.</p>
</sec>
<sec id="sec020">
<title>BindingDB/Commercial compounds</title>
<p>Similar to the above mentioned with BindingDB as the datasource. The commercial compounds worksheet contains a link to the chemical suppliers of BindingDB ligands for the target.</p>
</sec>
</sec>
<sec id="sec021">
<title>Prioritize a list of candidate targets</title>
<p>The target List Mode report provides the user with more than a hundred different metrics to define a potential target (<xref ref-type="supplementary-material" rid="pone.0232644.s003">S3 File</xref>) such as: number of crystal structures in the PDB, ChEMBL bioactive compounds, Open Targets disease associations, number of antibodies, human protein expression levels in tissues, etc. Such an abundance of available fields makes it hard to quickly identify a target’s profile or else to pick the most relevant parameters for the prioritization process. Therefore, we use a set of rules to define area-specific scores that aid target assessment and prioritization.</p>
<sec id="sec022">
<title>Area-specific scores for rapid target assessment</title>
<p>When evaluating potential targets, building an overall picture of a target profile is not an easy task with the information often fragmented across numerous resources. With TargetDB we have separated information into eight main categories: Druggability, Structure, Biology, Chemistry, Diseases, Genetics, Information and Safety (<xref ref-type="fig" rid="pone.0232644.g002">Fig 2</xref>). Each category is scored from zero to one according to a set of rules (<xref ref-type="supplementary-material" rid="pone.0232644.s001">S1 File</xref>). Once calculated these scores can be used to generate a spider plot of the target profile to rapidly identify the strengths and weaknesses of a given target in each category. From the few examples in <xref ref-type="fig" rid="pone.0232644.g003">Fig 3</xref>, it is easy to identify all these targets are well studied and associated with diseases (neurodegeneration), although only some of these have genetic evidence to support the observation. While acetylcholine esterase and beta-secretase 1 are highly druggable and drugged, it is interesting to note that APOE, one of the main risk factors for Alzheimer’s disease [<xref ref-type="bibr" rid="pone.0232644.ref023">23</xref>], does not score well in the druggability and chemistry area, which is consistent with the poor druggability of an apolipoprotein. These well-characterized examples illustrate how this representation allows for a quick interpretation of a target landscape. A guide for the interpretation of these spider plots is available in <xref ref-type="supplementary-material" rid="pone.0232644.s009">S1 Fig</xref>.</p>
<fig id="pone.0232644.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0232644.g002</object-id>
<label>Fig 2</label>
<caption>
<title>Area-specific scores.</title>
<p>Different features that were selected for the generation of the area-specific scores.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.g002" xlink:type="simple"/>
</fig>
<fig id="pone.0232644.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0232644.g003</object-id>
<label>Fig 3</label>
<caption>
<title>Spider plot for various targets.</title>
<p>The Height of each section represents the amount of information available in that area for this target. The color in the safety, genetic association, chemistry and structural biology are indications of the safety risk, the significance of associations, the quality of the chemical matter and the druggability of potential binding pockets respectively (Green = better quality/safety Red = poor quality/safety risk).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.g003" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec023">
<title>Multi-Parameter Optimization (MPO) score for target ranking</title>
<p>While ranking targets based on their area score could be used on its own, we also incorporated a customizable MPO score to allow multiple interpretations of the same data. For example, depending on the user interest for a structurally enabled target, it may be advantageous to prioritize targets for which 3D structures are available and with a high druggability score. By simply adjusting the weightings of each category, one can generate a tailored MPO score to facilitate prioritization according to key criteria (<xref ref-type="fig" rid="pone.0232644.g004">Fig 4</xref>). Likewise, negative weights can be set to deprioritize high ranking targets and prioritize low ranking targets, this can be useful if, for example, one wants to deprioritize targets for which there is already significant chemical matter available. The decision on how to set the different weights relies on user judgment and the specific criteria that are of interest to them. As a note of caution, while a user might decide to over-prioritize areas such as structural biology and chemistry it is by no means a guarantee that this will lead to a target with potential therapeutic applications. On the other hand, if a target is over-prioritized for strong disease and genetic links, it may be very difficult to develop safe and effective therapeutics due to low safety and structural druggability scores. This facility also enables users to tailor their searches to highlight targets where there is an opportunity for their research expertise to make a larger impact by picking targets for which there is a lack structural information, lack of chemistry or lack of biology, for example. The detailed methodology on how this MPO score is calculated is available in <xref ref-type="supplementary-material" rid="pone.0232644.s001">S1 File</xref>.</p>
<fig id="pone.0232644.g004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0232644.g004</object-id>
<label>Fig 4</label>
<caption>
<title>MPO weight input panel.</title>
<p>Interface to enter the individual weights for the construction of the MPO score.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.g004" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec024">
<title>Target tractability model</title>
<p>To further assist the decision-making process on target tractability, it was decided to evaluate whether or not a model of tractability could be built. With the vast amount of information collected, we might uncover trends that would allow classification of targets into tractability classes. To do so, several machine learning algorithms were tested, and their performance evaluated to predict target tractability. In order to train and evaluate the different models we needed to provide each algorithm with an annotated set of tractable and intractable targets. While finding a list of tractable targets is relatively easy, identifying a list of intractable targets proved to be more challenging. We used the DGIdb [<xref ref-type="bibr" rid="pone.0232644.ref013">13</xref>] “clinically actionable” annotated genes as our tractable list of targets (n = 399), while for the intractable control we selected a random set of targets (n = 400) from the list of targets present in TargetDB from which were removed the clinically actionable (n = 399) and the druggable genome (n = 6106) list from DGIdb. This combined set was then split into a training set (n = 560) and testing set (n = 240), each containing the same ratio of tractable/intractable targets. The complete list of targets used in the training and testing of the model is available in the <xref ref-type="supplementary-material" rid="pone.0232644.s004">S4 File</xref>.</p>
<p>After evaluation of multiple algorithms (a detailed procedure is available in <xref ref-type="supplementary-material" rid="pone.0232644.s001">S1 File</xref> as well as the Jupyter notebook in <xref ref-type="supplementary-material" rid="pone.0232644.s005">S5 File</xref>), the Random Forest algorithm was selected for further optimization (<xref ref-type="fig" rid="pone.0232644.g005">Fig 5</xref>). This method provides multiple advantages, such as reducing overfitting, the ability to extract information on features contributing to the decision, and providing an estimate of the confidence of the prediction. This allowed us to narrow down to a set of features that were truly contributing to the performance of the model. The underlying concept of this method is simple: the algorithm creates multiple decision trees; for each decision tree it selects a subset of features from the entire set available; all the decisions from all the trees are then compiled and a classification based on consensus is made for each target. After feature and parameter optimization, the model was evaluated against the test set and was able to accurately predict target tractability 85% of the time. A detailed description of the model performance is available in <xref ref-type="supplementary-material" rid="pone.0232644.s001">S1 File</xref>. The output of this model then provides two (related) readouts: Percentage of trees predicting the target to be tractable and the tractability class of a target (Tractable [&gt;60%] − Challenging [60%-40%] − Intractable [&lt;40%]).</p>
<fig id="pone.0232644.g005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0232644.g005</object-id>
<label>Fig 5</label>
<caption>
<title>Random forest.</title>
<p>Principle behind the Random Forest Machine learning algorithm.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.g005" xlink:type="simple"/>
</fig>
</sec>
</sec>
</sec>
<sec id="sec025" sec-type="conclusions">
<title>Discussion</title>
<p>To showcase the application of such a tool, we present here a workflow that was used to prioritize potential targets from a list of genes involved in Alzheimer’s diseases provided by the AMP-AD consortium (<ext-link ext-link-type="uri" xlink:href="https://agora.ampadportal.org" xlink:type="simple">https://agora.ampadportal.org</ext-link>). This list consists of 95 targets generated by 6 different teams using computational analysis of genomic, proteomic and/or metabolomic data from human samples [<xref ref-type="bibr" rid="pone.0232644.ref024">24</xref>,<xref ref-type="bibr" rid="pone.0232644.ref025">25</xref>]. Manual aggregation and collation of information for 95 targets is a time-consuming task but the same results can be achieved in only a few minutes using TargetDB. Once the program is started the user has only to input the list of targets in the window and select the run mode (single, list, plot); in our case the “List Mode” was selected. Once started, the program will take a few minutes to retrieve all the information in the database and another window will open to allow the user to input each area weight necessary to calculate a custom MPO score. In our case, the following weights were used: Structural information (= 100), Structural Druggability (= 150), Chemistry (= -100), Biology (= 100), Diseases Links (= 100), Genetic Links (= 150), Literature information (= -100), Safety (= 0). The rationale is that we want to select structurally druggable targets, with no or little chemistry available and with strong genetic associations. Biological information and link to diseases are parameters to consider but not essential and we wanted to deprioritize targets with large amounts of literature available. In this instance, the weight for the safety term was set to zero and was not, therefore, considered in the MPO scoring. Once the weights were entered, the program generates an excel spreadsheet with the list of targets and the calculated area-specific, tractability prediction and MPO scores (<xref ref-type="supplementary-material" rid="pone.0232644.s006">S6</xref> and <xref ref-type="supplementary-material" rid="pone.0232644.s007">S7</xref> Files). This spreadsheet can then be used to further refine the selection according to the user’s preferences.</p>
<p>The same list was independently examined by scientists for target selection. 4 targets were selected for further target validation work and early hit identification. When compared to TargetDB output ranking, 3 of these 4 targets were ranked in the top 10. Assessing these 95 targets took in total a few months and several meetings; it is a good example of how TargetDB may be used to accelerate and focus the attention onto the most promising targets, while not completely discarding the lesser ranked targets for further exploration.</p>
<p>Interestingly, other MPO criteria can be selected depending on the kind of work that is envisioned. For example, a team mainly interested in solving crystal structures might deprioritize targets with a solved crystal structure (Structural information &lt; 0) but still possessing favourable druggability potential calculated from data for close analogs (Structural Druggability ≥ 100) and with some therapeutic rationale (Genetic Links, Disease Links ≥100). These different criteria lead to a ranking significantly different to the first one (<xref ref-type="table" rid="pone.0232644.t001">Table 1</xref>).</p>
<table-wrap id="pone.0232644.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0232644.t001</object-id>
<label>Table 1</label> <caption><title>Different MPO scenario.</title></caption>
<alternatives>
<graphic id="pone.0232644.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.t001" xlink:type="simple"/>
<table>
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="center" colspan="2"><underline>SBDD MPO</underline></th>
<th align="center" colspan="2"><underline>Crystallography MPO</underline></th>
</tr>
<tr>
<th align="center">Gene Name</th>
<th align="center">MPO Score</th>
<th align="center">Gene name</th>
<th align="center">MPO Score</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">GRIN2A</td>
<td align="char" char=".">0.8</td>
<td align="left">SGPL1</td>
<td align="char" char=".">0.73</td>
</tr>
<tr>
<td align="left">PLEC</td>
<td align="char" char=".">0.79</td>
<td align="left">ALK</td>
<td align="char" char=".">0.69</td>
</tr>
<tr>
<td align="left">TGFBR2</td>
<td align="char" char=".">0.78</td>
<td align="left">SYNGAP1</td>
<td align="char" char=".">0.68</td>
</tr>
<tr>
<td align="left"><bold>PLCG2</bold></td>
<td align="char" char=".">0.78</td>
<td align="left">S1PR1</td>
<td align="char" char=".">0.67</td>
</tr>
<tr>
<td align="left">CFH</td>
<td align="char" char=".">0.78</td>
<td align="left">NEFL</td>
<td align="char" char=".">0.67</td>
</tr>
<tr>
<td align="left">TGFB1</td>
<td align="char" char=".">0.76</td>
<td align="left">CSF1R</td>
<td align="char" char=".">0.65</td>
</tr>
<tr>
<td align="left">AP2B1</td>
<td align="char" char=".">0.76</td>
<td align="left"><bold>PLCG2</bold></td>
<td align="char" char=".">0.63</td>
</tr>
<tr>
<td align="left">MSN</td>
<td align="char" char=".">0.74</td>
<td align="left">NR1H4</td>
<td align="char" char=".">0.62</td>
</tr>
<tr>
<td align="left">ERBB3</td>
<td align="char" char=".">0.74</td>
<td align="left">GFAP</td>
<td align="char" char=".">0.62</td>
</tr>
<tr>
<td align="left">TREM2</td>
<td align="char" char=".">0.73</td>
<td align="left">PPARA</td>
<td align="char" char=".">0.62</td>
</tr>
</tbody>
</table>
</alternatives>
<table-wrap-foot>
<fn id="t001fn001"><p>Comparison of the top10 ranked target for two different MPO Score scenarios. Left: Structure based drug design (SBDD). Right: Crystallography.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>Another application is the prioritization of an entire family of proteins. We showcase here how TargetDB was used to rapidly provide an overview of the solute carrier (SLC) family of transporters (<xref ref-type="fig" rid="pone.0232644.g006">Fig 6</xref> and <xref ref-type="supplementary-material" rid="pone.0232644.s008">S8 File</xref>). In less than an hour, we were able to shortlist potential targets based on their predicted tractability class, their MPO score, but also on the potential association with a disease of interest (Alzheimer’s (AD) or Parkinson’s disease (PD) in this case). After further assessment of the top targets, several of them are now under investigation within our institute. This case illustrates how TargetDB can be usefully inserted into the target discovery workflow to expedite as well as standardize the target prioritization process.</p>
<fig id="pone.0232644.g006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0232644.g006</object-id>
<label>Fig 6</label>
<caption>
<title>Target class analysis.</title>
<p>Summary of the analysis of the Solute Carrier (SLCs) family of transporters performed using TargetDB in list mode as drug targets for Alzheimer’s disease (AD) or Parkinson’s disease (PD). The definition of dark proteome is taken from the Target Central Resource Database [<xref ref-type="bibr" rid="pone.0232644.ref026">26</xref>].</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.g006" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec026" sec-type="conclusions">
<title>Conclusion</title>
<p>In conclusion, we present a tool that allows a researcher to extract/combine and standardize outputs from many different publically accessible databases and to rapidly compare the potential of multiple targets. TargetDB is freely available as a python package and detailed installation instructions are available on the project’s GitHub page as well as in the supporting information. While further improvements and additions are already being considered we encourage other users to participate in the project by adding their own additional datasources.</p>
</sec>
<sec id="sec027">
<title>Supporting information</title>
<supplementary-material id="pone.0232644.s001" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s001" xlink:type="simple">
<label>S1 File</label>
<caption>
<title>Additional experimental section.</title>
<p>Details of the different methods, datasources and calculations performed for the creation of TargetDB, discussion on the machine learning model.</p>
<p>(DOCX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0232644.s002" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s002" xlink:type="simple">
<label>S2 File</label>
<caption>
<title>Example of single mode output.</title>
<p>Output from the single mode for the gene BACE1.</p>
<p>(XLSX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0232644.s003" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s003" xlink:type="simple">
<label>S3 File</label>
<caption>
<title>Description of all the list mode columns.</title>
<p>(XLSX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0232644.s004" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s004" xlink:type="simple">
<label>S4 File</label>
<caption>
<title>Genes used in the machine learning model.</title>
<p>Excel file with the ID of the genes used in the machine learning model training and testing.</p>
<p>(XLSX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0232644.s005" mimetype="application/zip" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s005" xlink:type="simple">
<label>S5 File</label>
<caption>
<title>Jupyter notebook and training data.</title>
<p>Archive containing the jupyter notebook used to generate the tractability model.</p>
<p>(ZIP)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0232644.s006" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s006" xlink:type="simple">
<label>S6 File</label>
<caption>
<title>AMP-AD nominated list—Medicinal chemistry ranking.</title>
<p>(XLSX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0232644.s007" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s007" xlink:type="simple">
<label>S7 File</label>
<caption>
<title>AMP-AD nominated list—Structural biology ranking.</title>
<p>(XLSX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0232644.s008" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s008" xlink:type="simple">
<label>S8 File</label>
<caption>
<title>Solute Carrier Protein (SLC) prioritization list.</title>
<p>(XLSX)</p>
</caption>
</supplementary-material>
<supplementary-material id="pone.0232644.s009" mimetype="image/png" position="float" xlink:href="info:doi/10.1371/journal.pone.0232644.s009" xlink:type="simple">
<label>S1 Fig</label>
<caption>
<title>Guide to interpretation of spider plots.</title>
<p>(PNG)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ack>
<p>We would like to thank the AMP-AD consortium for providing the target list that was evaluated and the entire Oxford Drug Discovery Institute team for the effort put into evaluating these targets as well as providing useful information for the creation of this tool.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0232644.ref001"><label>1</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Visscher</surname> <given-names>PM</given-names></name>, <name name-style="western"><surname>Wray</surname> <given-names>NR</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>Q</given-names></name>, <name name-style="western"><surname>Sklar</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>McCarthy</surname> <given-names>MI</given-names></name>, <name name-style="western"><surname>Brown</surname> <given-names>MA</given-names></name>, <etal>et al</etal>. <article-title>10 Years of GWAS Discovery: Biology, Function, and Translation</article-title>. <source>Am J Hum Genet</source>. <year>2017</year>;<volume>101</volume>: <fpage>5</fpage>–<lpage>22</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ajhg.2017.06.005" xlink:type="simple">10.1016/j.ajhg.2017.06.005</ext-link></comment> <object-id pub-id-type="pmid">28686856</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref002"><label>2</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Huang</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Mertins</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Cao</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Gunawardena</surname> <given-names>HP</given-names></name>, <name name-style="western"><surname>Ruggles</surname> <given-names>KV.</given-names></name>, <etal>et al</etal>. <article-title>Proteogenomic integration reveals therapeutic targets in breast cancer xenografts</article-title>. <source>Nat Commun</source>. <year>2017</year>;<volume>8</volume>: <fpage>14864</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/ncomms14864" xlink:type="simple">10.1038/ncomms14864</ext-link></comment> <object-id pub-id-type="pmid">28348404</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref003"><label>3</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Korrodi-Gregório</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Soto-Cerrato</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Vitorino</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Fardilha</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Pérez-Tomás</surname> <given-names>R</given-names></name>. <article-title>From Proteomic Analysis to Potential Therapeutic Targets: Functional Profile of Two Lung Cancer Cell Lines, A549 and SW900, Widely Studied in Pre-Clinical Research</article-title>. <name name-style="western"><surname>Ahmad</surname> <given-names>A</given-names></name>, editor. <source>PLoS One</source>. <year>2016</year>;<volume>11</volume>: <fpage>e0165973</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0165973" xlink:type="simple">10.1371/journal.pone.0165973</ext-link></comment> <object-id pub-id-type="pmid">27814385</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref004"><label>4</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Tian</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Muneeruddin</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Choi</surname> <given-names>MY</given-names></name>, <name name-style="western"><surname>Tao</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Bhuiyan</surname> <given-names>RH</given-names></name>, <name name-style="western"><surname>Ohmi</surname> <given-names>Y</given-names></name>, <etal>et al</etal>. <article-title>Genome-wide CRISPR screens for Shiga toxins and ricin reveal Golgi proteins critical for glycosylation</article-title>. <source>PLOS Biol</source>. <year>2018</year>;<volume>16</volume>: <fpage>e2006951</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pbio.2006951" xlink:type="simple">10.1371/journal.pbio.2006951</ext-link></comment> <object-id pub-id-type="pmid">30481169</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref005"><label>5</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Behan</surname> <given-names>FM</given-names></name>, <name name-style="western"><surname>Iorio</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Picco</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Gonçalves</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Beaver</surname> <given-names>CM</given-names></name>, <name name-style="western"><surname>Migliardi</surname> <given-names>G</given-names></name>, <etal>et al</etal>. <article-title>Prioritization of cancer therapeutic targets using CRISPR–Cas9 screens</article-title>. <source>Nature</source>. <year>2019</year>;<volume>568</volume>: <fpage>511</fpage>–<lpage>516</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41586-019-1103-9" xlink:type="simple">10.1038/s41586-019-1103-9</ext-link></comment></mixed-citation></ref>
<ref id="pone.0232644.ref006"><label>6</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Michaels</surname> <given-names>YS</given-names></name>, <name name-style="western"><surname>Barnkob</surname> <given-names>MB</given-names></name>, <name name-style="western"><surname>Barbosa</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Baeumler</surname> <given-names>TA</given-names></name>, <name name-style="western"><surname>Thompson</surname> <given-names>MK</given-names></name>, <name name-style="western"><surname>Andre</surname> <given-names>V</given-names></name>, <etal>et al</etal>. <article-title>Precise tuning of gene expression levels in mammalian cells</article-title>. <source>Nat Commun</source>. <year>2019</year>;<volume>10</volume>: <fpage>818</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41467-019-08777-y" xlink:type="simple">10.1038/s41467-019-08777-y</ext-link></comment> <object-id pub-id-type="pmid">30778069</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref007"><label>7</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Mohr</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Bakal</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Perrimon</surname> <given-names>N</given-names></name>. <article-title>Genomic Screening with RNAi: Results and Challenges</article-title>. <source>Annu Rev Biochem</source>. <year>2010</year>;<volume>79</volume>: <fpage>37</fpage>–<lpage>64</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1146/annurev-biochem-060408-092949" xlink:type="simple">10.1146/annurev-biochem-060408-092949</ext-link></comment> <object-id pub-id-type="pmid">20367032</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref008"><label>8</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Bateman</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Martin</surname> <given-names>MJ</given-names></name>, <name name-style="western"><surname>O’Donovan</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Magrane</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Alpi</surname> <given-names>E</given-names></name>, <name name-style="western"><surname>Antunes</surname> <given-names>R</given-names></name>, <etal>et al</etal>. <article-title>UniProt: the universal protein knowledgebase</article-title>. <source>Nucleic Acids Res</source>. <year>2017</year>;<volume>45</volume>: <fpage>D158</fpage>–<lpage>D169</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gkw1099" xlink:type="simple">10.1093/nar/gkw1099</ext-link></comment> <object-id pub-id-type="pmid">27899622</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref009"><label>9</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wishart</surname> <given-names>DS</given-names></name>, <name name-style="western"><surname>Feunang</surname> <given-names>YD</given-names></name>, <name name-style="western"><surname>Guo</surname> <given-names>AC</given-names></name>, <name name-style="western"><surname>Lo</surname> <given-names>EJ</given-names></name>, <name name-style="western"><surname>Marcu</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Grant</surname> <given-names>JR</given-names></name>, <etal>et al</etal>. <article-title>DrugBank 5.0: a major update to the DrugBank database for 2018</article-title>. <source>Nucleic Acids Res</source>. <year>2018</year>;<volume>46</volume>: <fpage>D1074</fpage>–<lpage>D1082</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gkx1037" xlink:type="simple">10.1093/nar/gkx1037</ext-link></comment> <object-id pub-id-type="pmid">29126136</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref010"><label>10</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Gaulton</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Hersey</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Nowotka</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Bento</surname> <given-names>AP</given-names></name>, <name name-style="western"><surname>Chambers</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Mendez</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>The ChEMBL database in 2017</article-title>. <source>Nucleic Acids Res</source>. <year>2017</year>;<volume>45</volume>: <fpage>D945</fpage>–<lpage>D954</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gkw1074" xlink:type="simple">10.1093/nar/gkw1074</ext-link></comment> <object-id pub-id-type="pmid">27899562</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref011"><label>11</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Carvalho-Silva</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Pierleoni</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Pignatelli</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Ong</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Fumis</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Karamanis</surname> <given-names>N</given-names></name>, <etal>et al</etal>. <article-title>Open Targets Platform: new developments and updates two years on</article-title>. <source>Nucleic Acids Res</source>. <year>2019</year>;<volume>47</volume>: <fpage>D1056</fpage>–<lpage>D1065</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gky1133" xlink:type="simple">10.1093/nar/gky1133</ext-link></comment> <object-id pub-id-type="pmid">30462303</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref012"><label>12</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Li</surname> <given-names>YH</given-names></name>, <name name-style="western"><surname>Yu</surname> <given-names>CY</given-names></name>, <name name-style="western"><surname>Li</surname> <given-names>XX</given-names></name>, <name name-style="western"><surname>Zhang</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Tang</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Yang</surname> <given-names>Q</given-names></name>, <etal>et al</etal>. <article-title>Therapeutic target database update 2018: Enriched resource for facilitating bench-to-clinic research of targeted therapeutics</article-title>. <source>Nucleic Acids Res</source>. <year>2018</year>;<volume>46</volume>: <fpage>D1121</fpage>–<lpage>D1127</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gkx1076" xlink:type="simple">10.1093/nar/gkx1076</ext-link></comment> <object-id pub-id-type="pmid">29140520</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref013"><label>13</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Cotto</surname> <given-names>KC</given-names></name>, <name name-style="western"><surname>Wagner</surname> <given-names>AH</given-names></name>, <name name-style="western"><surname>Feng</surname> <given-names>Y-Y</given-names></name>, <name name-style="western"><surname>Kiwala</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Coffman</surname> <given-names>AC</given-names></name>, <name name-style="western"><surname>Spies</surname> <given-names>G</given-names></name>, <etal>et al</etal>. <article-title>DGIdb 3.0: a redesign and expansion of the drug–gene interaction database</article-title>. <source>Nucleic Acids Res</source>. <year>2018</year>;<volume>46</volume>: <fpage>D1068</fpage>–<lpage>D1073</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gkx1143" xlink:type="simple">10.1093/nar/gkx1143</ext-link></comment></mixed-citation></ref>
<ref id="pone.0232644.ref014"><label>14</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Nguyen</surname> <given-names>D-T</given-names></name>, <name name-style="western"><surname>Mathias</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Bologa</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Brunak</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Fernandez</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Gaulton</surname> <given-names>A</given-names></name>, <etal>et al</etal>. <article-title>Pharos: Collating protein information to shed light on the druggable genome</article-title>. <source>Nucleic Acids Res</source>. <year>2017</year>;<volume>45</volume>: <fpage>D995</fpage>–<lpage>D1002</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gkw1072" xlink:type="simple">10.1093/nar/gkw1072</ext-link></comment> <object-id pub-id-type="pmid">27903890</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref015"><label>15</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Rigden</surname> <given-names>DJ</given-names></name>, <name name-style="western"><surname>Fernández</surname> <given-names>XM</given-names></name>. <article-title>The 2018 Nucleic Acids Research database issue and the online molecular biology database collection</article-title>. <source>Nucleic Acids Res</source>. <year>2018</year>;<volume>46</volume>: <fpage>D1</fpage>–<lpage>D7</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gkx1235" xlink:type="simple">10.1093/nar/gkx1235</ext-link></comment> <object-id pub-id-type="pmid">29316735</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref016"><label>16</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Pearson</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Malki</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Evans</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Vidler</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Ruble</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Scherschel</surname> <given-names>J</given-names></name>, <etal>et al</etal>. <article-title>TractaViewer: a genome-wide tool for preliminary assessment of therapeutic target druggability</article-title>. <name name-style="western"><surname>Wren</surname> <given-names>J</given-names></name>, editor. <source>Bioinformatics</source>. <year>2019</year>;<volume>35</volume>: <fpage>4509</fpage>–<lpage>4510</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/bioinformatics/btz270" xlink:type="simple">10.1093/bioinformatics/btz270</ext-link></comment> <object-id pub-id-type="pmid">31070721</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref017"><label>17</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Le Guilloux</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Schmidtke</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Tuffery</surname> <given-names>P</given-names></name>. <article-title>Fpocket: an open source platform for ligand pocket detection</article-title>. <source>BMC Bioinformatics</source>. <year>2009</year>;<volume>10</volume>: <fpage>168</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-10-168" xlink:type="simple">10.1186/1471-2105-10-168</ext-link></comment> <object-id pub-id-type="pmid">19486540</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref018"><label>18</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Pedregosa</surname> <given-names>F</given-names></name>, <name name-style="western"><surname>Varoquaux</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Gramfort</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Michel</surname> <given-names>V</given-names></name>, <name name-style="western"><surname>Thirion</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Grisel</surname> <given-names>O</given-names></name>, <etal>et al</etal>. <article-title>Scikit-learn: Machine Learning in Python</article-title>. <source>J Mach Learn Res</source>. <year>2011</year>;<volume>12</volume>: <fpage>2825</fpage>–<lpage>2830</lpage>. Available: <ext-link ext-link-type="uri" xlink:href="http://jmlr.csail.mit.edu/papers/v12/pedregosa11a.html" xlink:type="simple">http://jmlr.csail.mit.edu/papers/v12/pedregosa11a.html</ext-link></mixed-citation></ref>
<ref id="pone.0232644.ref019"><label>19</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Kalderimis</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Lyne</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Butano</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Contrino</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Lyne</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Heimbach</surname> <given-names>J</given-names></name>, <etal>et al</etal>. <article-title>InterMine: extensive web services for modern biology</article-title>. <source>Nucleic Acids Res</source>. <year>2014</year>;<volume>42</volume>: <fpage>W468</fpage>–<lpage>W472</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/nar/gku301" xlink:type="simple">10.1093/nar/gku301</ext-link></comment> <object-id pub-id-type="pmid">24753429</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref020"><label>20</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Schmidtke</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Barril</surname> <given-names>X</given-names></name>. <article-title>Understanding and predicting druggability. A high-throughput method for detection of drug binding sites</article-title>. <source>J Med Chem</source>. <year>2010</year>;<volume>53</volume>: <fpage>5858</fpage>–<lpage>5867</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1021/jm100574m" xlink:type="simple">10.1021/jm100574m</ext-link></comment> <object-id pub-id-type="pmid">20684613</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref021"><label>21</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Shannon</surname> <given-names>CE</given-names></name>. <article-title>A Mathematical Theory of Communication</article-title>. <source>Bell Syst Tech J</source>. <year>1948</year>;<volume>27</volume>: <fpage>379</fpage>–<lpage>423</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/j.1538-7305.1948.tb01338.x" xlink:type="simple">10.1002/j.1538-7305.1948.tb01338.x</ext-link></comment></mixed-citation></ref>
<ref id="pone.0232644.ref022"><label>22</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Wager</surname> <given-names>TT</given-names></name>, <name name-style="western"><surname>Hou</surname> <given-names>X</given-names></name>, <name name-style="western"><surname>Verhoest</surname> <given-names>PR</given-names></name>, <name name-style="western"><surname>Villalobos</surname> <given-names>A</given-names></name>. <article-title>Moving beyond Rules: The Development of a Central Nervous System Multiparameter Optimization (CNS MPO) Approach To Enable Alignment of Druglike Properties</article-title>. <source>ACS Chem Neurosci</source>. <year>2010</year>;<volume>1</volume>: <fpage>435</fpage>–<lpage>449</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1021/cn100008c" xlink:type="simple">10.1021/cn100008c</ext-link></comment> <object-id pub-id-type="pmid">22778837</object-id></mixed-citation></ref>
<ref id="pone.0232644.ref023"><label>23</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Stocker</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Möllers</surname> <given-names>T</given-names></name>, <name name-style="western"><surname>Perna</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Brenner</surname> <given-names>H</given-names></name>. <article-title>The genetic risk of Alzheimer’s disease beyond APOE ε4: systematic review of Alzheimer’s genetic risk scores</article-title>. <source>Transl Psychiatry</source>. <year>2018</year>;<volume>8</volume>: <fpage>166</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41398-018-0221-8" xlink:type="simple">10.1038/s41398-018-0221-8</ext-link></comment></mixed-citation></ref>
<ref id="pone.0232644.ref024"><label>24</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>De Jager</surname> <given-names>PL</given-names></name>, <name name-style="western"><surname>Ma</surname> <given-names>Y</given-names></name>, <name name-style="western"><surname>McCabe</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Xu</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Vardarajan</surname> <given-names>BN</given-names></name>, <name name-style="western"><surname>Felsky</surname> <given-names>D</given-names></name>, <etal>et al</etal>. <article-title>A multi-omic atlas of the human frontal cortex for aging and Alzheimer’s disease research</article-title>. <source>Sci Data</source>. <year>2018</year>;<volume>5</volume>: <fpage>180142</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/sdata.2018.142" xlink:type="simple">10.1038/sdata.2018.142</ext-link></comment></mixed-citation></ref>
<ref id="pone.0232644.ref025"><label>25</label><mixed-citation publication-type="journal" xlink:type="simple"><name name-style="western"><surname>Mukherjee</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Perumal</surname> <given-names>TM</given-names></name>, <name name-style="western"><surname>Daily</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Sieberts</surname> <given-names>SK</given-names></name>, <name name-style="western"><surname>Omberg</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Preuss</surname> <given-names>C</given-names></name>, <etal>et al</etal>. <article-title>Identifying and ranking potential driver genes of Alzheimer’s disease using multiview evidence aggregation</article-title>. <source>Bioinformatics</source>. <year>2019</year>;<volume>35</volume>: <fpage>i568</fpage>–<lpage>i576</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/bioinformatics/btz365" xlink:type="simple">10.1093/bioinformatics/btz365</ext-link></comment></mixed-citation></ref>
<ref id="pone.0232644.ref026"><label>26</label><mixed-citation publication-type="other" xlink:type="simple">Target Central Resources Database. [cited 22 Jun 2020]. <ext-link ext-link-type="uri" xlink:href="http://juniper.health.unm.edu/tcrd/" xlink:type="simple">http://juniper.health.unm.edu/tcrd/</ext-link></mixed-citation></ref>
</ref-list>
</back>
<sub-article article-type="aggregated-review-documents" id="pone.0232644.r001" specific-use="decision-letter">
<front-stub>
<article-id pub-id-type="doi">10.1371/journal.pone.0232644.r001</article-id>
<title-group>
<article-title>Decision Letter 0</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name name-style="western">
<surname>Barchi</surname>
<given-names>Joseph J</given-names>
</name>
<role>Academic Editor</role>
</contrib>
</contrib-group>
<permissions>
<copyright-year>2020</copyright-year>
<copyright-holder>Joseph J Barchi</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<related-object document-id="10.1371/journal.pone.0232644" document-id-type="doi" document-type="article" id="rel-obj001" link-type="peer-reviewed-article"/>
<custom-meta-group>
<custom-meta>
<meta-name>Submission Version</meta-name>
<meta-value>0</meta-value>
</custom-meta>
</custom-meta-group>
</front-stub>
<body>
<p>
<named-content content-type="letter-date">5 Jun 2020</named-content>
</p>
<p>PONE-D-20-11085</p>
<p>TargetDB: A target information aggregation tool and tractability predictor</p>
<p>PLOS ONE</p>
<p>Dear Dr. De Cesco,</p>
<p>Thank you for submitting your manuscript to PLOS ONE. After careful consideration, we feel that it has merit but does not fully meet PLOS ONE’s publication criteria as it currently stands. Therefore, we invite you to submit a revised version of the manuscript that addresses the points raised during the review process.</p>
<p>As you can see the 3 reviewers were quite positive overall, and all recommend publication. Please pay attention to the comments and respond accordingly---I would be happy to accept a revised version of this manuscript as soon as I receive and review your modified paper. </p>
<p>Please submit your revised manuscript by Jul 20 2020 11:59PM. If you will need more time than this to complete your revisions, please reply to this message or contact the journal office at <email xlink:type="simple">plosone@plos.org</email>. When you're ready to submit your revision, log on to <ext-link ext-link-type="uri" xlink:href="https://www.editorialmanager.com/pone/" xlink:type="simple">https://www.editorialmanager.com/pone/</ext-link> and select the 'Submissions Needing Revision' folder to locate your manuscript file.</p>
<p>Please include the following items when submitting your revised manuscript:</p>
<p><list list-type="bullet"><list-item><p>A rebuttal letter that responds to each point raised by the academic editor and reviewer(s). You should upload this letter as a separate file labeled 'Response to Reviewers'.</p></list-item><list-item><p>A marked-up copy of your manuscript that highlights changes made to the original version. You should upload this as a separate file labeled 'Revised Manuscript with Track Changes'.</p></list-item><list-item><p>An unmarked version of your revised paper without tracked changes. You should upload this as a separate file labeled 'Manuscript'.</p></list-item></list></p>
<p>If you would like to make changes to your financial disclosure, please include your updated statement in your cover letter. Guidelines for resubmitting your figure files are available below the reviewer comments at the end of this letter.</p>
<p>If applicable, we recommend that you deposit your laboratory protocols in protocols.io to enhance the reproducibility of your results. Protocols.io assigns your protocol its own identifier (DOI) so that it can be cited independently in the future. For instructions see: <ext-link ext-link-type="uri" xlink:href="http://journals.plos.org/plosone/s/submission-guidelines#loc-laboratory-protocols" xlink:type="simple">http://journals.plos.org/plosone/s/submission-guidelines#loc-laboratory-protocols</ext-link></p>
<p>We look forward to receiving your revised manuscript.</p>
<p>Kind regards,</p>
<p>Joseph J Barchi</p>
<p>Academic Editor</p>
<p>PLOS ONE</p>
<p>Journal Requirements:</p>
<p>When submitting your revision, we need you to address these additional requirements.</p>
<p>1. Please ensure that your manuscript meets PLOS ONE's style requirements, including those for file naming. The PLOS ONE style templates can be found at <ext-link ext-link-type="uri" xlink:href="https://journals.plos.org/plosone/s/file?id=wjVg/PLOSOne_formatting_sample_main_body.pdf" xlink:type="simple">https://journals.plos.org/plosone/s/file?id=wjVg/PLOSOne_formatting_sample_main_body.pdf</ext-link> and <ext-link ext-link-type="uri" xlink:href="https://journals.plos.org/plosone/s/file?id=ba62/PLOSOne_formatting_sample_title_authors_affiliations.pdf" xlink:type="simple">https://journals.plos.org/plosone/s/file?id=ba62/PLOSOne_formatting_sample_title_authors_affiliations.pdf</ext-link></p>
<p>2. Please ensure that you refer to Figure 2 in your text as, if accepted, production will need this reference to link the reader to the figure.</p>
<p>3. Please upload a copy of Figure 7, to which you refer in your text. If the figure is no longer to be included as part of the submission please remove all reference to it within the text.</p>
<p>4. Please include captions for your Supporting Information files at the end of your manuscript, and update any in-text citations to match accordingly. Please see our Supporting Information guidelines for more information: <ext-link ext-link-type="uri" xlink:href="about:blank" xlink:type="simple">http://journals.plos.org/plosone/s/supporting-information</ext-link>.</p>
<p>Additional Editor Comments (if provided):</p>
<p>[Note: HTML markup is below. Please do not edit.]</p>
<p>Reviewers' comments:</p>
<p>Reviewer's Responses to Questions</p>
<p><!-- <font color="black"> --><bold>Comments to the Author</bold></p>
<p>1. Is the manuscript technically sound, and do the data support the conclusions?</p>
<p>The manuscript must describe a technically sound piece of scientific research with data that supports the conclusions. Experiments must have been conducted rigorously, with appropriate controls, replication, and sample sizes. The conclusions must be drawn appropriately based on the data presented. <!-- </font> --></p>
<p>Reviewer #1: Yes</p>
<p>Reviewer #2: Yes</p>
<p>Reviewer #3: Yes</p>
<p>**********</p>
<p><!-- <font color="black"> -->2. Has the statistical analysis been performed appropriately and rigorously? <!-- </font> --></p>
<p>Reviewer #1: Yes</p>
<p>Reviewer #2: I Don't Know</p>
<p>Reviewer #3: N/A</p>
<p>**********</p>
<p><!-- <font color="black"> -->3. Have the authors made all data underlying the findings in their manuscript fully available?</p>
<p>The <ext-link ext-link-type="uri" xlink:href="http://www.plosone.org/static/policies.action#sharing" xlink:type="simple">PLOS Data policy</ext-link> requires authors to make all data underlying the findings described in their manuscript fully available without restriction, with rare exception (please refer to the Data Availability Statement in the manuscript PDF file). The data should be provided as part of the manuscript or its supporting information, or deposited to a public repository. For example, in addition to summary statistics, the data points behind means, medians and variance measures should be available. If there are restrictions on publicly sharing data—e.g. participant privacy or use of data from a third party—those must be specified.<!-- </font> --></p>
<p>Reviewer #1: Yes</p>
<p>Reviewer #2: Yes</p>
<p>Reviewer #3: Yes</p>
<p>**********</p>
<p><!-- <font color="black"> -->4. Is the manuscript presented in an intelligible fashion and written in standard English?</p>
<p>PLOS ONE does not copyedit accepted manuscripts, so the language in submitted articles must be clear, correct, and unambiguous. Any typographical or grammatical errors should be corrected at revision, so please note any specific errors here.<!-- </font> --></p>
<p>Reviewer #1: Yes</p>
<p>Reviewer #2: Yes</p>
<p>Reviewer #3: Yes</p>
<p>**********</p>
<p><!-- <font color="black"> -->5. Review Comments to the Author</p>
<p>Please use the space provided to explain your answers to the questions above. You may also include additional comments for the author, including concerns about dual publication, research ethics, or publication ethics. (Please upload your review as an attachment if it exceeds 20,000 characters)<!-- </font> --></p>
<p>Reviewer #1: The authors have developed a handy tool to assist researchers with the challenging task of prioritising a list of potential targets. A large number of various data resources are integrated and final outputs in terms of excel sheets are reported. The ability to adjust weights for main categories is particular useful to customise ranking of targets.</p>
<p>1.) We installed the targetDB package via conda as described on the github page, on MacOS. An initial run failed due to missing xlsxwriter and xlrd packages. Perhaps those dependencies can be mentioned as part of the installation instructions. After installation of those packages the software ran successfully.</p>
<p>2.) Occasionally, an error is thrown, presumably if no protein expression levels are available.</p>
<p>KeyError: "['Muscle tissues', 'Female tissues', 'Bone marrow &amp; lymphoid tissues', 'Liver &amp; gallbladder', 'Proximal digestive tract', 'Gastrointestinal tract', 'Kidney &amp; urinary bladder', 'Male tissues', 'Adipose &amp; soft tissue', 'Endocrine tissues'] not in index"</p>
<p>For example, when entering SLC6A8 and SLC6A5 as the gene list in 'List mode'. These corner cases should be caught and dealt with instead of left just hanging.</p>
<p>3.) There is a spreadsheet called "Not in DB" in List mode. Is this supposed to provide the user with the subset of genes that were not found/matched in the DB? This is useful if dozens of genes were entered and the user can quickly check which genes were not found. However, the spreadsheet is empty at the moment if gene names were not found.</p>
<p>4.) The mode 'Spider plot only' does not give an option to save the produced figure, at least not on MacOS.</p>
<p>5.) A supplementary table should be included listing the 399 tractable targets, 400 intractable targets and their allocation into training and test sets.</p>
<p>6.) Table 1, it is not clear what 'SBDD' stands for.</p>
<p>7.) Figure 6, provide the reader with a short explanation of the 'dark proteome'</p>
<p>8.) What about other tools with very similar functionality, e.g. differences between TargetDB and the recently published TractaViewer should be discussed.</p>
<p>9.) It's somewhat unfortunate that the name "TargetDB" has been used previously for another DB (PMID: 15130928). The authors might want to consider renaming their software/DB, although it seems that this older DB and its original name is not in use anymore.</p>
<p>Reviewer #2: This paper presents a useful tool that aggregates information on a given human gene and presents that information in an easy to read and manipulate format. I can see that this tool would be very useful for prioritising gene targets in the context of early stage drug discovery in industry and also academic pipelines. The ability to up/down-weight the various parameter spaces in terms of the scoring is a nice feature which makes this a generically useful tool.</p>
<p>I was able to download and install the program successfully and run a number of targets through it. I only tested under Linux so cannot say if it would work well under Windows or Mac.</p>
<p>Some comments and requests:</p>
<p>• I note that the supplied database is for ChEMBL 24, which is now quite out of date. I would like to see some instructions on how a newer version of ChEMBL (i.e. 26) can be used, notwithstanding the fact that it’s likely some code changes will be required to accommodate any ChEMBL schema changes</p>
<p>• I would like to see guidance on how the program can be extended in principle. For example, population information on common SNPs, or integration of data from gnomAD.</p>
<p>• The spider plots are very useful visualisations. However, it’s a bit hard to get your head around the filled colour schemes in the single gene output. I would like to see a legend underneath to explain the fill colours to the reader.</p>
<p>• I would like to see a more detailed discussion on the machine learning process and outcomes in the text. Whilst the jupyter notebook is reasonably understandable, more discussion is required on why the exact form of Random Forest was chosen, in the context of the other methods tested. This is important because it gives the community a better understanding of your experience of using a large and diverse parameter space, which others can take advantage of.</p>
<p>• You state that “Safety is not considered in the MPO scoring at this time”. It is not clear to me whether you mean that the MPO weighting is not considered or just that in the example you set this to zero. Please clarify.</p>
<p>• Open Targets is ‘misspelled’ in a number of places. Please use the correct version ‘Open Targets’ consistently.</p>
<p>• Please provide a reference to Humanmine.</p>
<p>• Please can you describe in more detail what the selectivity score is? You specific that it is (selectivity entropy – Shannon entropy) and reference the seminar 1948 information theory paper, but there is not enough information here to reproduce what you are trying to achieve.</p>
<p>• It appears that there are no resolution cut-offs used for structures that go through fpocket analysis. Please can you explain if that is the case and why you feel this is appropriate, if so? An EM structure of &gt;6 Angstroms is going to provide unreliable results in this context, for example.</p>
<p>• What is the sustainability plan for targetDB? Since databases change all the time, how will you ensure that this platform is still usable even in 6 months’ time?</p>
<p>• It is highly unusual to use ellipses in articles. Please remove these and use ‘etc.’ (for example) instead.</p>
<p>• It would be good to have the article carefully proof read for English before it is finally accepted.</p>
<p>Overall, a nice piece of work that I’m sure many will want to use.</p>
<p>Reviewer #3: The authors construct a database application with a graphical interface that aggregates multiple disparate sources of evidence for novel drug target evaluation. They consider measures of druggability, structure, chemistry, biology, disease association, genetic association, general information, and safety when constructing their application. As output they produce different summaries of this evidence - either a summary for a single target, multiple targets, or a graphical summary (aka a spider plot). Furthermore, the authors provide an optimization approach (powered by a machine learning method) to allow users to weight multiple classes of evidence based on the users target validation needs and interests.</p>
<p>Major comments -</p>
<p>Overall the authors provide a potentially useful tool to aid structural biologists, chemists, and assay developers for target prioritization. That being said, I have the following comments:</p>
<p>1. How reproducible are the results generated by this - many of the databases that evidence is being pulled from may change over time. Is there some way to version the results, or to construct queries that refer to a specific version of a public database?</p>
<p>2. The user defined weighting is an interesting idea - I would like to see the authors discuss potential pitfalls of this - e.g. over optimizing for targets with interesting structural biology/chemistry as opposed to targets that will actually lead to therapies or deeper insights into the disease biology.</p>
<p>Minor comments -</p>
<p>1. use of ellipses is distracting (Abstract, Introduction Paragraph 1).</p>
<p>2. “Percentage of threes predicting” - spelling/grammar throughout should be double checked.</p>
<p>3. SBDD acronym in Table 1 is not defined.</p>
<p>**********</p>
<p><!-- <font color="black"> -->6. PLOS authors have the option to publish the peer review history of their article (<ext-link ext-link-type="uri" xlink:href="https://journals.plos.org/plosone/s/editorial-and-peer-review-process#loc-peer-review-history" xlink:type="simple">what does this mean?</ext-link>). If published, this will include your full peer review and any attached files.</p>
<p>If you choose “no”, your identity will remain anonymous but your review may still be made public.</p>
<p><bold>Do you want your identity to be public for this peer review?</bold> For information about this choice, including consent withdrawal, please see our <ext-link ext-link-type="uri" xlink:href="https://www.plos.org/privacy-policy" xlink:type="simple">Privacy Policy</ext-link>.<!-- </font> --></p>
<p>Reviewer #1: No</p>
<p>Reviewer #2: No</p>
<p>Reviewer #3: No</p>
<p>[NOTE: If reviewer comments were submitted as an attachment file, they will be attached to this email and accessible via the submission site. Please log into your account, locate the manuscript record, and check for the action link "View Attachments". If this link does not appear, there are no attachment files.]</p>
<p>While revising your submission, please upload your figure files to the Preflight Analysis and Conversion Engine (PACE) digital diagnostic tool, <ext-link ext-link-type="uri" xlink:href="https://pacev2.apexcovantage.com/" xlink:type="simple">https://pacev2.apexcovantage.com/</ext-link>. PACE helps ensure that figures meet PLOS requirements. To use PACE, you must first register as a user. Registration is free. Then, login and navigate to the UPLOAD tab, where you will find detailed instructions on how to use the tool. If you encounter any issues or have any questions when using PACE, please email PLOS at <email xlink:type="simple">figures@plos.org</email>. Please note that Supporting Information files do not need this step.</p>
</body>
</sub-article>
<sub-article article-type="author-comment" id="pone.0232644.r002">
<front-stub>
<article-id pub-id-type="doi">10.1371/journal.pone.0232644.r002</article-id>
<title-group>
<article-title>Author response to Decision Letter 0</article-title>
</title-group>
<related-object document-id="10.1371/journal.pone.0232644" document-id-type="doi" document-type="peer-reviewed-article" id="rel-obj002" link-type="rebutted-decision-letter" object-id="10.1371/journal.pone.0232644.r001" object-id-type="doi" object-type="decision-letter"/>
<custom-meta-group>
<custom-meta>
<meta-name>Submission Version</meta-name>
<meta-value>1</meta-value>
</custom-meta>
</custom-meta-group>
</front-stub>
<body>
<p>
<named-content content-type="author-response-date">22 Jul 2020</named-content>
</p>
<p>PREFACE: Some answers to reviewers contains figures or equations, therefore, all answers have been added to the cover letter as well</p>
<p>Reviewers’ comments to the authors:</p>
<p>Reviewer #1</p>
<p>The authors have developed a handy tool to assist researchers with the challenging task of prioritising a list of potential targets. A large number of various data resources are integrated and final outputs in terms of excel sheets are reported. The ability to adjust weights for main categories is particular useful to customise ranking of targets.</p>
<p>Answer: We thank the reviewer for their kind words and are happy that he/she finds it useful.</p>
<p>1.) We installed the targetDB package via conda as described on the github page, on MacOS. An initial run failed due to missing xlsxwriter and xlrd packages. Perhaps those dependencies can be mentioned as part of the installation instructions. After installation of those packages the software ran successfully.</p>
<p>Answer: Thanks for the comment, the conda package wasn’t yet created at the time of submission and it hasn’t been tested extensively. As it is another contributor that created the package I asked him to include these packages to the dependency list. </p>
<p>2.) Occasionally, an error is thrown, presumably if no protein expression levels are available.</p>
<p>KeyError: "['Muscle tissues', 'Female tissues', 'Bone marrow &amp; lymphoid tissues', 'Liver &amp; gallbladder', 'Proximal digestive tract', 'Gastrointestinal tract', 'Kidney &amp; urinary bladder', 'Male tissues', 'Adipose &amp; soft tissue', 'Endocrine tissues'] not in index"</p>
<p>For example, when entering SLC6A8 and SLC6A5 as the gene list in 'List mode'. These corner cases should be caught and dealt with instead of left just hanging.</p>
<p>Answer: It has now been fixed in the code in version 1.3.1 of the python package</p>
<p>3.) There is a spreadsheet called "Not in DB" in List mode. Is this supposed to provide the user with the subset of genes that were not found/matched in the DB? This is useful if dozens of genes were entered and the user can quickly check which genes were not found. However, the spreadsheet is empty at the moment if gene names were not found.</p>
<p>Answer: It has now been fixed in the code in version 1.3.1 of the python package</p>
<p>4.) The mode 'Spider plot only' does not give an option to save the produced figure, at least not on MacOS.</p>
<p>Answer: We thank the reviewer for the suggestion, it has now been added to the version 1.3.1 of the python package. </p>
<p>5.) A supplementary table should be included listing the 399 tractable targets, 400 intractable targets and their allocation into training and test sets.</p>
<p>Answer: An additional SI document titled “ML_TrainingTestingSplit_Targets.xlsx” has been added. The document contains two tabs with the testing and training set and each has 2 columns: Target Uniprot ID and Druggability class (1 = Druggable, 0=Intractable) </p>
<p>6.) Table 1, it is not clear what 'SBDD' stands for.</p>
<p>Answer: This has now been clarified in the legend of the table. </p>
<p>7.) Figure 6, provide the reader with a short explanation of the 'dark proteome'</p>
<p>Answer: We have added the following text under the figure: “The definition of dark proteome is taken from the Target Central Resource Database.” Including a reference to the definition on the TCRD platform website ( <ext-link ext-link-type="uri" xlink:href="http://juniper.health.unm.edu/tcrd/" xlink:type="simple">http://juniper.health.unm.edu/tcrd/</ext-link>)</p>
<p>8.) What about other tools with very similar functionality, e.g. differences between TargetDB and the recently published TractaViewer should be discussed.</p>
<p>Answer: A sentence has been added to discuss the differences between the two tools:</p>
<p>“More recently, a tool with similar features, TractaViewer, has been described in the literature [16]. While this tool allows the user to classify targets into different bins, it does not provide an area specific score or a general scoring system that can be used for target prioritization. The bin assignment combined with the scoring system of TargetDB, however, could provide valuable information to researchers seeking to assess target tractability</p>
<p>9.) It's somewhat unfortunate that the name "TargetDB" has been used previously for another DB (PMID: 15130928). The authors might want to consider renaming their software/DB, although it seems that this older DB and its original name is not in use anymore.</p>
<p>Answer: While we certainly agree with the reviewer, we eventually decided not to change the name as, the reviewer pointed out, the older platform has not been in use for a long time. We believe the TargetDB name reflects best the purpose of this tool.  Furthermore, a significant number of academic research teams in the UK and a few pharmaceutical companies are already familiar with the TargetDB name and are using our platform. Therefore, we feel it would be better to continue to use TargetDB</p>
<p>Reviewer #2</p>
<p>This paper presents a useful tool that aggregates information on a given human gene and presents that information in an easy to read and manipulate format. I can see that this tool would be very useful for prioritising gene targets in the context of early stage drug discovery in industry and also academic pipelines. The ability to up/down-weight the various parameter spaces in terms of the scoring is a nice feature which makes this a generically useful tool.</p>
<p>Answer: We thank the reviewer for their kind words and are happy that he/she finds it useful.</p>
<p>I was able to download and install the program successfully and run a number of targets through it. I only tested under Linux so cannot say if it would work well under Windows or Mac.</p>
<p>Some comments and requests:</p>
<p>• I note that the supplied database is for ChEMBL 24, which is now quite out of date. I would like to see some instructions on how a newer version of ChEMBL (i.e. 26) can be used, notwithstanding the fact that it’s likely some code changes will be required to accommodate any ChEMBL schema changes</p>
<p>Answer: The readme file on github has been updated to reflect the fact that the data in the present release has been used with ChEMBL 25. The next update of the database (scheduled for August) will be using ChEMBL 27 or the most recent release at the time of the update.</p>
<p>• I would like to see guidance on how the program can be extended in principle. For example, population information on common SNPs, or integration of data from gnomAD.</p>
<p>Answer: All the source code is available on GitHub and anyone with experience in python can branch the repository to add any valuable information to the output. This may be completed in a couple of steps: </p>
<p>- Convert/parse the data into a pandas dataframe (example of this is in the druggability_DB.py file) and store it as an attribute of the Class Target (line 1290)</p>
<p>- Add this dataframe to the sqlite database (and create a new table) using the function write_to_db() (line 1074 - druggability_DB.py)</p>
<p>- To add it to the output these three files would need to be updated accordingly as well: </p>
<p> targetDB\\druggability_report.py</p>
<p> targetDB\\target_descriptors.py</p>
<p> targetDB\\target_features.py</p>
<p>We have added a sentence to convey this message of collaborative effort more clearly:</p>
<p>“We strongly encourage anyone interested to download the code and participate in the project by adding new datasources and/or features.”</p>
<p>• The spider plots are very useful visualisations. However, it’s a bit hard to get your head around the filled colour schemes in the single gene output. I would like to see a legend underneath to explain the fill colours to the reader.</p>
<p>Answer: We agree that the spider plot combines a lot of data in different forms and a reading guide would be beneficial. We have added a key to the SI (S1_Fig), as well as to the documentation on the github page of the project, to help the user interpret the plot. We hope the reviewers find this useful.</p>
<p>• I would like to see a more detailed discussion on the machine learning process and outcomes in the text. Whilst the jupyter notebook is reasonably understandable, more discussion is required on why the exact form of Random Forest was chosen, in the context of the other methods tested. This is important because it gives the community a better understanding of your experience of using a large and diverse parameter space, which others can take advantage of.</p>
<p>Answer: While we certainly agree with the reviewer that others can take advantage of the process we went through, we believe that the technical details of the model training and evaluation are better suited for the supplemental information (S1 File), where we go into detail about picking/removing collinear features and selection/refinement of the best algorithm. We have added the following sentence to the main text to provide better context to why the random forest algorithm was picked: </p>
<p>“This allowed us to narrow down to a set of features that were truly contributing to the performance of the model.”</p>
<p>• You state that “Safety is not considered in the MPO scoring at this time”. It is not clear to me whether you mean that the MPO weighting is not considered or just that in the example you set this to zero. Please clarify.</p>
<p>Answer: We are sorry this was not more clear. The original meaning was that the weight was set to zero in that specific instance. We have now reformulated the sentence to make it clearer. The sentence now reads: </p>
<p>“ In this instance, the weight for the safety term was set to zero and was not, therefore,  considered in the MPO scoring”</p>
<p>• Open Targets is ‘misspelled’ in a number of places. Please use the correct version ‘Open Targets’ consistently.</p>
<p>Answer: This has now been fixed in the revised manuscript.</p>
<p>• Please provide a reference to Humanmine.</p>
<p>Answer: We are sorry to have missed that, it has been added to the revised manuscript</p>
<p>• Please can you describe in more detail what the selectivity score is? You specific that it is (selectivity entropy – Shannon entropy) and reference the seminar 1948 information theory paper, but there is not enough information here to reproduce what you are trying to achieve.</p>
<p>Answer: A more detailed calculation has been added in the Supporting information S1 File</p>
<p>The Shannon entropy was used as a measure of selectivity for the two following metrics. The global equation is the following:</p>
<p>S_sel=-∑_i^T▒〖ρ_i   log⁡〖ρ_i 〗 〗</p>
<p>With Ssel = Selectivity Entropy</p>
<p>Selectivity of compound</p>
<p> T = Kd for different targets </p>
<p> ρ_i = Probability for a Kd value</p>
<p>ρ_((T) )=〖K_d〗_T /(∑_i▒〖K_d〗_i )</p>
<p> Where KdT = Binding association for target T</p>
<p>Selectivity of tissue expression</p>
<p> T = Expression in different tissue </p>
<p> ρ_i = Probability of an expression value</p>
<p>ρ_((T))=E_T /(∑_i▒〖E_T〗_i )</p>
<p> Where ET = Expression value in tissue T</p>
<p>• It appears that there are no resolution cut-offs used for structures that go through fpocket analysis. Please can you explain if that is the case and why you feel this is appropriate, if so? An EM structure of &gt;6 Angstroms is going to provide unreliable results in this context, for example.</p>
<p>Answer: We thank the reviewer for his suggestion, as of now, it is true that no cut-offs are put in place but this will certainly be implemented in the next release of the database. In the meantime, the information on the resolution of the structure is captured on a different tab and can be used to manually remove any binding pocket result coming from such low resolution structures. (This has been captured as a enhancement request on the GitHub page: <ext-link ext-link-type="uri" xlink:href="https://github.com/sdecesco/targetDB/issues/10" xlink:type="simple">https://github.com/sdecesco/targetDB/issues/10</ext-link>)</p>
<p>• What is the sustainability plan for targetDB? Since databases change all the time, how will you ensure that this platform is still usable even in 6 months’ time?</p>
<p>Answer: As of now two avenues are open, we are committed to update the database bi-annually for the foreseeable future, and are also working on a separate version which would collect data live from various API of these datasources. The disadvantage of the live version would be that it would be slower and would more easily break down if any of the used datasource modify their outputs in a significant manner. </p>
<p>Moreover, one of the main reason to make the entire source code available is to allow anyone with enough experience in python to modulate and/or fix TargetDB in the future.  </p>
<p>• It is highly unusual to use ellipses in articles. Please remove these and use ‘etc.’ (for example) instead.</p>
<p>Answer: Ellipses have been removed in the revised manuscript</p>
<p>• It would be good to have the article carefully proof read for English before it is finally accepted.</p>
<p>Answer: We thank the reviewer for the advice and the manuscript has now been carefully proofread by native English speakers.</p>
<p>Overall, a nice piece of work that I’m sure many will want to use.</p>
<p>Answer: We thank the reviewer again for their kind words.</p>
<p>Reviewer #3</p>
<p>The authors construct a database application with a graphical interface that aggregates multiple disparate sources of evidence for novel drug target evaluation. They consider measures of druggability, structure, chemistry, biology, disease association, genetic association, general information, and safety when constructing their application. As output they produce different summaries of this evidence - either a summary for a single target, multiple targets, or a graphical summary (aka a spider plot). Furthermore, the authors provide an optimization approach (powered by a machine learning method) to allow users to weight multiple classes of evidence based on the users target validation needs and interests.</p>
<p>Major comments -</p>
<p>Overall the authors provide a potentially useful tool to aid structural biologists, chemists, and assay developers for target prioritization. That being said, I have the following comments:</p>
<p>1. How reproducible are the results generated by this - many of the databases that evidence is being pulled from may change over time. Is there some way to version the results, or to construct queries that refer to a specific version of a public database?</p>
<p>Answer: The current model is that the database behind TargetDB is generated at a certain date and time by pulling data from specific versions of databases (which are specified in the supporting information and/or fields in the database itself) or through the API of the sources at that same date (+/- few days as the creation of the TargetDB database takes a few days to complete) </p>
<p>2. The user defined weighting is an interesting idea - I would like to see the authors discuss potential pitfalls of this - e.g. over optimizing for targets with interesting structural biology/chemistry as opposed to targets that will actually lead to therapies or deeper insights into the disease biology.</p>
<p>Answer: This is an interesting and important point raised by the reviewer. Providing this tool of course does not guarantee that it will always be used in a way that leads to therapies. We have added a few words of caution regarding the use of these weights in target prioritization: </p>
<p>“As note of caution, while a user might decide to over-prioritize areas such as structural biology and chemistry it is by no means a guarantee that this will lead to a target with potential therapeutic applications. This facility also enables users to tailor their searches to highlight targets where there is an opportunity for their research expertise to make  an impact; picking targets for which there is a lack structural information, lack of chemistry or even lack of biology, for example On the other hand, if a target is over-prioritized for strong disease and genetic links, it may be very difficult to develop safe and effective therapeutics due to low safety and structural druggability scores.”</p>
<p>Minor comments -</p>
<p>1. use of ellipses is distracting (Abstract, Introduction Paragraph 1).</p>
<p>Answer: These have now been removed from the revised manuscript (see reviewer #2 comments)</p>
<p>2. “Percentage of threes predicting” - spelling/grammar throughout should be double checked.</p>
<p>Answer: Spelling and grammar has now been checked throughout the document</p>
<p>3. SBDD acronym in Table 1 is not defined.</p>
<p>Answer: Definition of the acronym has now been added to the text</p>
</body>
</sub-article>
<sub-article article-type="editor-report" id="pone.0232644.r003" specific-use="decision-letter">
<front-stub>
<article-id pub-id-type="doi">10.1371/journal.pone.0232644.r003</article-id>
<title-group>
<article-title>Decision Letter 1</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name name-style="western">
<surname>Barchi</surname>
<given-names>Joseph J</given-names>
</name>
<role>Academic Editor</role>
</contrib>
</contrib-group>
<permissions>
<copyright-year>2020</copyright-year>
<copyright-holder>Joseph J Barchi</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<related-object document-id="10.1371/journal.pone.0232644" document-id-type="doi" document-type="article" id="rel-obj003" link-type="peer-reviewed-article"/>
<custom-meta-group>
<custom-meta>
<meta-name>Submission Version</meta-name>
<meta-value>1</meta-value>
</custom-meta>
</custom-meta-group>
</front-stub>
<body>
<p>
<named-content content-type="letter-date">29 Jul 2020</named-content>
</p>
<p>TargetDB: A target information aggregation tool and tractability predictor</p>
<p>PONE-D-20-11085R1</p>
<p>Dear Dr. De Cesco,</p>
<p>We’re pleased to inform you that your manuscript has been judged scientifically suitable for publication and will be formally accepted for publication once it meets all outstanding technical requirements.</p>
<p>Within one week, you’ll receive an e-mail detailing the required amendments. When these have been addressed, you’ll receive a formal acceptance letter and your manuscript will be scheduled for publication.</p>
<p>An invoice for payment will follow shortly after the formal acceptance. To ensure an efficient process, please log into Editorial Manager at <ext-link ext-link-type="uri" xlink:href="http://www.editorialmanager.com/pone/" xlink:type="simple">http://www.editorialmanager.com/pone/</ext-link>, click the 'Update My Information' link at the top of the page, and double check that your user information is up-to-date. If you have any billing related questions, please contact our Author Billing department directly at <email xlink:type="simple">authorbilling@plos.org</email>.</p>
<p>If your institution or institutions have a press office, please notify them about your upcoming paper to help maximize its impact. If they’ll be preparing press materials, please inform our press team as soon as possible -- no later than 48 hours after receiving the formal acceptance. Your manuscript will remain under strict press embargo until 2 pm Eastern Time on the date of publication. For more information, please contact <email xlink:type="simple">onepress@plos.org</email>.</p>
<p>Kind regards,</p>
<p>Joseph J Barchi</p>
<p>Academic Editor</p>
<p>PLOS ONE</p>
<p>Additional Editor Comments (optional):</p>
<p>Reviewers' comments:</p>
</body>
</sub-article>
<sub-article article-type="editor-report" id="pone.0232644.r004" specific-use="acceptance-letter">
<front-stub>
<article-id pub-id-type="doi">10.1371/journal.pone.0232644.r004</article-id>
<title-group>
<article-title>Acceptance letter</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name name-style="western">
<surname>Barchi</surname>
<given-names>Joseph J</given-names>
</name>
<role>Academic Editor</role>
</contrib>
</contrib-group>
<permissions>
<copyright-year>2020</copyright-year>
<copyright-holder>Joseph J Barchi</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<related-object document-id="10.1371/journal.pone.0232644" document-id-type="doi" document-type="article" id="rel-obj004" link-type="peer-reviewed-article"/>
</front-stub>
<body>
<p>
<named-content content-type="letter-date">3 Aug 2020</named-content>
</p>
<p>PONE-D-20-11085R1 </p>
<p>TargetDB: A target information aggregation tool and tractability predictor </p>
<p>Dear Dr. De Cesco:</p>
<p>I'm pleased to inform you that your manuscript has been deemed suitable for publication in PLOS ONE. Congratulations! Your manuscript is now with our production department. </p>
<p>If your institution or institutions have a press office, please let them know about your upcoming paper now to help maximize its impact. If they'll be preparing press materials, please inform our press team within the next 48 hours. Your manuscript will remain under strict press embargo until 2 pm Eastern Time on the date of publication. For more information please contact <email xlink:type="simple">onepress@plos.org</email>.</p>
<p>If we can help with anything else, please email us at <email xlink:type="simple">plosone@plos.org</email>. </p>
<p>Thank you for submitting your work to PLOS ONE and supporting open access. </p>
<p>Kind regards, </p>
<p>PLOS ONE Editorial Office Staff</p>
<p>on behalf of</p>
<p>Dr. Joseph J Barchi  </p>
<p>Academic Editor</p>
<p>PLOS ONE</p>
</body>
</sub-article>
</article>