<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.1d3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id>
<journal-id journal-id-type="publisher-id">plos</journal-id>
<journal-id journal-id-type="pmc">plosone</journal-id>
<journal-title-group>
<journal-title>PLOS ONE</journal-title>
</journal-title-group>
<issn pub-type="epub">1932-6203</issn>
<publisher>
<publisher-name>Public Library of Science</publisher-name>
<publisher-loc>San Francisco, CA USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">PONE-D-18-17903</article-id>
<article-id pub-id-type="doi">10.1371/journal.pone.0205219</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research Article</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>A fully automated, faster noise rejection approach to increasing the analytical capability of chemical imaging for digital histopathology</article-title>
<alt-title alt-title-type="running-head">Noise reduction and spectral chemical imaging</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0001-8145-9347</contrib-id>
<name name-style="western">
<surname>Gupta</surname> <given-names>Soumyajit</given-names></name>
<role content-type="http://credit.casrai.org/">Data curation</role>
<role content-type="http://credit.casrai.org/">Formal analysis</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Software</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" equal-contrib="yes" xlink:type="simple">
<name name-style="western">
<surname>Mittal</surname> <given-names>Shachi</given-names></name>
<role content-type="http://credit.casrai.org/">Data curation</role>
<role content-type="http://credit.casrai.org/">Investigation</role>
<role content-type="http://credit.casrai.org/">Validation</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Kajdacsy-Balla</surname> <given-names>Andre</given-names></name>
<role content-type="http://credit.casrai.org/">Validation</role>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author" xlink:type="simple">
<name name-style="western">
<surname>Bhargava</surname> <given-names>Rohit</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes" xlink:type="simple">
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-9619-3278</contrib-id>
<name name-style="western">
<surname>Bajaj</surname> <given-names>Chandrajit</given-names></name>
<role content-type="http://credit.casrai.org/">Conceptualization</role>
<role content-type="http://credit.casrai.org/">Methodology</role>
<role content-type="http://credit.casrai.org/">Project administration</role>
<role content-type="http://credit.casrai.org/">Supervision</role>
<role content-type="http://credit.casrai.org/">Writing – original draft</role>
<role content-type="http://credit.casrai.org/">Writing – review &amp; editing</role>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="corresp" rid="cor001">*</xref>
</contrib>
</contrib-group>
<aff id="aff001">
<label>1</label>
<addr-line>Department of Computer Science, Computational Visualization Center, University of Texas at Austin, Austin, Texas 78705, United States of America</addr-line>
</aff>
<aff id="aff002">
<label>2</label>
<addr-line>Department of Bioengineering, University of Illinois, Urbana Champaign, Urbana, Illinois 61801, United States of America</addr-line>
</aff>
<aff id="aff003">
<label>3</label>
<addr-line>Department of Pathology, University of Illinois at Chicago, Chicago, Illinois 60612, United States of America</addr-line>
</aff>
<contrib-group>
<contrib contrib-type="editor" xlink:type="simple">
<name name-style="western">
<surname>Metze</surname> <given-names>Konradin</given-names></name>
<role>Editor</role>
<xref ref-type="aff" rid="edit1"/>
</contrib>
</contrib-group>
<aff id="edit1">
<addr-line>University of Campinas, BRAZIL</addr-line>
</aff>
<author-notes>
<fn fn-type="conflict" id="coi001">
<p>The authors have declared that no competing interests exist.</p>
</fn>
<corresp id="cor001">* E-mail: <email xlink:type="simple">bajaj@cs.utexas.edu</email></corresp>
</author-notes>
<pub-date pub-type="collection">
<year>2019</year>
</pub-date>
<pub-date pub-type="epub">
<day>24</day>
<month>4</month>
<year>2019</year>
</pub-date>
<volume>14</volume>
<issue>4</issue>
<elocation-id>e0205219</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>6</month>
<year>2018</year>
</date>
<date date-type="accepted">
<day>6</day>
<month>4</month>
<year>2019</year>
</date>
</history>
<permissions>
<copyright-year>2019</copyright-year>
<copyright-holder>Gupta et al</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.1371/journal.pone.0205219"/>
<abstract>
<p>Chemical hyperspectral imaging (HSI) data is naturally high dimensional and large. There are thus inherent manual trade-offs in acquisition time, and the quality of data. Minimum Noise Fraction (MNF) developed by Green <italic>et al</italic>. [<xref ref-type="bibr" rid="pone.0205219.ref001">1</xref>] has been extensively studied as a method for noise removal in HSI data. It too, however entails a manual speed-accuracy trade-off, namely the process of manually selecting the relevant bands in the MNF space. This process currently takes roughly around a month’s time for acquiring and pre-processing an entire TMA with acceptable signal to noise ratio. We present three approaches termed ‘Fast MNF’, ‘Approx MNF’ and ‘Rand MNF’ where the computational time of the algorithm is reduced, as well as the entire process of band selection is fully automated. This automated approach is shown to perform at the same level of accuracy as MNF with now large speedup factors, resulting in the same task to be accomplished in hours. The different approximations produced by the three algorithms, show the reconstruction accuracy vs storage (50×) and runtime speed (60×) trade-off. We apply the approach for automating the denoising of different tissue histology samples, in which the accuracy of classification (differentiating between the different histologic and pathologic classes) strongly depends on the SNR (signal to noise ratio) of recovered data. Therefore, we also compare the effect of the proposed denoising algorithms on classification accuracy. Since denoising HSI data is done unsupervised, we also use a metric that assesses the quality of denoising in the image domain between the noisy and denoised image in the absence of ground truth.</p>
</abstract>
<funding-group>
<award-group id="award001">
<funding-source>
<institution-wrap>
<institution-id institution-id-type="funder-id">http://dx.doi.org/10.13039/100000002</institution-id>
<institution>National Institutes of Health</institution>
</institution-wrap>
</funding-source>
<award-id>R01GM117594</award-id>
<principal-award-recipient>
<contrib-id authenticated="true" contrib-id-type="orcid">http://orcid.org/0000-0002-9619-3278</contrib-id>
<name name-style="western">
<surname>Bajaj</surname> <given-names>Chandrajit</given-names></name>
</principal-award-recipient>
</award-group>
<funding-statement>This research was supported in part by NIH grants R01GM117594, R41GM116300 and Dell-Seton 201602388.</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="1"/>
<page-count count="15"/>
</counts>
<custom-meta-group>
<custom-meta id="data-availability">
<meta-name>Data Availability</meta-name>
<meta-value>All relevant data are within the paper and its Supporting Information files.</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>Chemical imaging is an emerging technology in which every pixel or voxel of an image contains hyperspectral data, often consisting of hundreds or thousands of data points. The spectrum at each pixel resolves the chemical components at that point and, thus, provides the molecular profile of the sample [<xref ref-type="bibr" rid="pone.0205219.ref002">2</xref>–<xref ref-type="bibr" rid="pone.0205219.ref004">4</xref>]. Computer algorithms that can process the data to information useful for a particular problem often require a specific data quality, at that spectral resolution, that often determines scanning (signal averaging) time. In addition to the chemical signature of the data, another benefit of modern technologies including machine learning is that workflows can be automated with fully digital structure and function analysis of the data [<xref ref-type="bibr" rid="pone.0205219.ref005">5</xref>–<xref ref-type="bibr" rid="pone.0205219.ref008">8</xref>]. For example, Fourier Transform Infrared (FT-IR) spectroscopic imaging is emerging as an automated alternative to human examination in studying disease development and progression by using statistical pattern recognition [<xref ref-type="bibr" rid="pone.0205219.ref009">9</xref>–<xref ref-type="bibr" rid="pone.0205219.ref014">14</xref>]. For a practical protocol for tissue imaging, as demonstrated in at least one instance of tissue histopathology, the signal-to-noise ratio (SNR) of 4<italic>cm</italic><sup>−1</sup> resolution spectral data needs to be more than 1000: 1 [<xref ref-type="bibr" rid="pone.0205219.ref013">13</xref>]. To achieve this SNR, especially for the emerging high definition IR imaging [<xref ref-type="bibr" rid="pone.0205219.ref015">15</xref>–<xref ref-type="bibr" rid="pone.0205219.ref017">17</xref>], extensive signal averaging is required. The need for signal averaging increases processing time <inline-formula id="pone.0205219.e001"><alternatives><graphic id="pone.0205219.e001g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e001" xlink:type="simple"/><mml:math display="inline" id="M1"><mml:mrow><mml:mo>(</mml:mo> <mml:mtext>SNR</mml:mtext> <mml:mo>∼</mml:mo> <mml:msqrt><mml:mi>t</mml:mi></mml:msqrt> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>, in turn, increasing acquisition time [<xref ref-type="bibr" rid="pone.0205219.ref018">18</xref>] to the extent that clinical translation becomes impractical. Signal processing approaches to reduce noise has previously been suggested to mitigate this crippling increase in integration time by mathematical methods to utilize correlations in data to reduce noise but suffer from two major drawbacks. First, given the large size of the data, the mathematical operations require computer processing often comparable to the acquisition time itself [<xref ref-type="bibr" rid="pone.0205219.ref019">19</xref>]. Second, such methods invariably try to separate data into informative and noisy components; subsequently, a manual selection step is required to identify the information-bearing components thus compromising the automation benefits of using spectroscopic imaging for tissue analysis [<xref ref-type="bibr" rid="pone.0205219.ref020">20</xref>].</p>
<p>One class of mathematical transform techniques for noise reduction utilize the property that noise is uncorrelated whereas spectra (signals) have a high degree of correlation. In a transform domain, hence, the signal becomes largely confined to a few eigenvalues whereas the noise is spread across all. Noise reduction can be achieved by retaining eigenvalue images that correspond to high signal content and computing the inverse transform. All the eigenvalue data contain signal and noise but the relative proportion of the signal to noise which forms a threshold criterion for inclusion of specific eigen-images in the inverse transform. Inclusion of too many will not allow for significant noise rejection, while inclusion of too few would result in loss of fine spectral features. Hence, identifying eigenvalues corresponding to high signal content is an important step in the noise reduction process.</p>
<p>One widely used algorithm was provided by Green <italic>et al</italic>. [<xref ref-type="bibr" rid="pone.0205219.ref001">1</xref>] that applies Minimum Noise Fraction (MNF) to order spectral components in terms of SNR in the transformed space. It assumes that the covariance for the raw data Σ<sub><italic>Y</italic></sub> and the noise Σ<sub><italic>δ</italic></sub> can both be estimated. Similar to principal component analysis (PCA) that orders the components in terms of variance, after transformation in MNF space, the top components are chosen and filtered and rest are zeroed out. This reduced basis is then used for inverse transformation into the signal space. Noise Adjusted Principal Components (NAPC) transform by Lee <italic>et al</italic>. [<xref ref-type="bibr" rid="pone.0205219.ref021">21</xref>] is a reformulation of the MNF transform in terms of noise whitening process. While MNF and NAPC transforms are mathematically equivalent, the latter consists of a sequence of two principal component transforms: First to whiten the data (de-correlate noise from data); Second to perform eigen decomposition on the modified covariance matrix, to order the underlying data by SNR.</p>
<p>Our goals in this work are to address the major challenges in noise rejection using mathematical methods. Specifically, first, we aim to provide criteria for unsupervised band selection, thereby maintaining objectivity of the data analysis protocol and reducing analysis time within the data processing pipeline by dispensing with the need for manual intervention. Second, we aim to re-examine the mathematical formulation of the MNF approach to speed up the process of computation of the forward and inverse transform MNF vectors. Specifically, we examine two novel approaches: (a) use of a truncated singular value decomposition (SVD) variant that is computationally more efficient, and (b) the use of a randomized variant of the above that is also memory efficient and has a reconstruction accuracy-memory trade-off depending on the application. Finally, we seek to improve the signal processing methods to provide a higher confidence in the consistency and accuracy of the noise rejection pipeline. We propose a comparison between acquired and denoised biomedical images using a robust metric, thereby providing better denoising guarantees in terms of both root mean square error (RMSE) and structural similarity.</p>
</sec>
<sec id="sec002" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="sec003">
<title>Sample preparation and data collection</title>
<p>A paraffin embedded breast tissue microarray (<italic>BR</italic>1003) consisting of 101 cores were obtained from US Biomax, Inc. The unstained sections of the TMA were placed on a <italic>BaF</italic><sub>2</sub> salt plate for IR imaging. The sections were deparaffinized using a 24<italic>h</italic> hexane bath. High Definition data was acquired using the Agilent Stingray imaging system with 0.62 numerical aperture and a 128 × 128 focal plane array. A spectral resolution of 4<italic>cm</italic><sup>−1</sup> along with a pixel size of 1.1<italic>μm</italic> was obtained at the sample plane. The final FTIR sample has a spatial dimension of 11620 × 11620 pixels and spectral dimension of 1506 channels.</p>
</sec>
<sec id="sec004">
<title>Classification</title>
<p>A random forest classifier was used to differentiate between the different histologic classes of a tissue sample. Labeled pixels for each class were obtained by the cases annotated by a pathologist. The pathologist distinguishes dense from loose collagen just by looking at the density of the collagen fibers that are elucidated by the Hematoxylin and Eosin (H&amp;E) stain. Pre-cancerous and malignant epithelium are also identified using the H&amp;E stained images as these images are high resolution images that provide contrast in different cell types in the tissue. These images are used to delineate nuclear architectures, shapes and sizes. These cellular features along with the presence of basal cells and the extent of cellular growth are used to confirm the disease state. On the other hand, while infrared imaging does not provide as much spatial detail but offers a wide variety of molecular signatures that help in disease detection despite the lower resolution.</p>
<p>In this study, we have used a four class model separating benign epithelium from malignant epithelium. Finally, to assess the performance of the classifier, sensitivity and specificity is calculated for all the classes to generate the receiver operating characteristic curve. The area under this curve signifies the diagnostic potential of the model.</p>
</sec>
</sec>
<sec id="sec005" sec-type="materials|methods">
<title>Methods</title>
<p>In practical situations, noiseless data <italic>d</italic><sub><italic>j</italic></sub> is recorded by instruments as a noisy signal estimate <italic>y</italic><sub><italic>j</italic></sub>, due to fluctuations in detector current, backgrounds and source/instrument factors, which is modeled as:
<disp-formula id="pone.0205219.e002"><alternatives><graphic id="pone.0205219.e002g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e002" xlink:type="simple"/><mml:math display="block" id="M2"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:msub><mml:mi>y</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:msub><mml:mi>d</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>δ</mml:mi> <mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(1)</label></disp-formula>
where <inline-formula id="pone.0205219.e003"><alternatives><graphic id="pone.0205219.e003g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e003" xlink:type="simple"/><mml:math display="inline" id="M3"><mml:mrow><mml:msub><mml:mi>y</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>∈</mml:mo> <mml:msup><mml:mi mathvariant="double-struck">R</mml:mi> <mml:mi>S</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> is the actual data collected by the apparatus and <inline-formula id="pone.0205219.e004"><alternatives><graphic id="pone.0205219.e004g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e004" xlink:type="simple"/><mml:math display="inline" id="M4"><mml:mrow><mml:msub><mml:mi>δ</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>∈</mml:mo> <mml:msup><mml:mi mathvariant="double-struck">R</mml:mi> <mml:mi>S</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> is the noise in the same pixel. The goal is to estimate <italic>δ</italic><sub><italic>j</italic></sub> given <italic>y</italic><sub><italic>j</italic></sub>, so we can best estimate the true signal <italic>d</italic><sub><italic>j</italic></sub> such that the relevant features (peak positions, peak heights, relative peak spacing etc.) in the spectrum are preserved.</p>
<p>Given a HSI <inline-formula id="pone.0205219.e005"><alternatives><graphic id="pone.0205219.e005g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e005" xlink:type="simple"/><mml:math display="inline" id="M5"><mml:mrow><mml:msub><mml:mi>Y</mml:mi> <mml:mrow><mml:mi>o</mml:mi> <mml:mi>r</mml:mi> <mml:mi>i</mml:mi> <mml:mi>g</mml:mi></mml:mrow></mml:msub> <mml:mo>∈</mml:mo> <mml:msup><mml:mi mathvariant="double-struck">R</mml:mi> <mml:mrow><mml:mi>W</mml:mi> <mml:mo>×</mml:mo> <mml:mi>H</mml:mi> <mml:mo>×</mml:mo> <mml:mi>S</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>, where <italic>W</italic>, <italic>H</italic> are the spatial dimensions (width and height respectively), it has been restructured into a 2<italic>D</italic> matrix <inline-formula id="pone.0205219.e006"><alternatives><graphic id="pone.0205219.e006g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e006" xlink:type="simple"/><mml:math display="inline" id="M6"><mml:mrow><mml:mi>Y</mml:mi> <mml:mo>∈</mml:mo> <mml:msup><mml:mi mathvariant="double-struck">R</mml:mi> <mml:mrow><mml:mi>N</mml:mi> <mml:mo>×</mml:mo> <mml:mi>S</mml:mi></mml:mrow></mml:msup></mml:mrow></mml:math></alternatives></inline-formula>, where <italic>N</italic> = (<italic>W</italic> × <italic>H</italic>) is the number of pixels, <italic>S</italic> is the number of spectral channels. Each column <italic>y</italic><sub><italic>i</italic></sub>, ∀<italic>i</italic> = [1: <italic>S</italic>] represents the reshaped image for the <italic>i</italic><sup><italic>th</italic></sup> spectral band and each row <italic>y</italic><sub><italic>j</italic></sub>, ∀<italic>j</italic> = [1: <italic>N</italic>] represents the spectral signature for the <italic>j</italic><sup><italic>th</italic></sup> pixel. The <italic>i</italic><sup><italic>th</italic></sup> entry of the spectral vector <inline-formula id="pone.0205219.e007"><alternatives><graphic id="pone.0205219.e007g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e007" xlink:type="simple"/><mml:math display="inline" id="M7"><mml:mrow><mml:msub><mml:mi>y</mml:mi> <mml:mi>j</mml:mi></mml:msub> <mml:mo>∈</mml:mo> <mml:msup><mml:mi mathvariant="double-struck">R</mml:mi> <mml:mi>S</mml:mi></mml:msup></mml:mrow></mml:math></alternatives></inline-formula> of each pixel <italic>y</italic><sub><italic>ij</italic></sub> determines the absorbance value of the tissue at that wavenumber. Wavenumbers <italic>ν</italic> are defined as inverse of wavelength and have units <italic>cm</italic><sup>−1</sup>. The recorded value at each wavenumber has unit <italic>absorbance</italic>/<italic>au</italic>, where <italic>au</italic> is arbitrary unit.</p>
<sec id="sec006">
<title>Mathematical background</title>
<p>Assuming additive noise only, raw data can be represented as <italic>Y</italic> = <italic>D</italic> + <italic>δ</italic>, where <italic>Y</italic> = {<italic>Y</italic><sub>1</sub>, …, <italic>Y</italic><sub><italic>S</italic></sub>} and <italic>D</italic> and <italic>δ</italic> are the uncorrelated signal (actual spectral data with baseline included) and noise components of the raw data <italic>Y</italic>. <italic>Cov</italic>{<italic>Y</italic>} = Σ<sub><italic>Y</italic></sub> = Σ<sub><italic>D</italic></sub> + Σ<sub><italic>δ</italic></sub>, where Σ<sub><italic>D</italic></sub> and Σ<sub><italic>δ</italic></sub> are the covariance matrices of <italic>D</italic> and <italic>δ</italic> respectively. Noise Fraction (NF) for the <italic>i</italic><sup><italic>th</italic></sup> band is defined as the ratio of noise variance to the total variance for that band. Similarly Signal to Noise ratio (SNR) for the <italic>i</italic><sup><italic>th</italic></sup> band is defined as the ratio of signal variance to the noise variance for that band.
<disp-formula id="pone.0205219.e008"><alternatives><graphic id="pone.0205219.e008g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e008" xlink:type="simple"/><mml:math display="block" id="M8"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>N</mml:mi> <mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mo>=</mml:mo> <mml:mi>V</mml:mi> <mml:mi>a</mml:mi> <mml:mi>r</mml:mi> <mml:mrow><mml:mo>{</mml:mo> <mml:msub><mml:mi>δ</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>}</mml:mo></mml:mrow> <mml:mo>/</mml:mo> <mml:mi>V</mml:mi> <mml:mi>a</mml:mi> <mml:mi>r</mml:mi> <mml:mrow><mml:mo>{</mml:mo> <mml:msub><mml:mi>Y</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>}</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(2)</label></disp-formula> <disp-formula id="pone.0205219.e009"><alternatives><graphic id="pone.0205219.e009g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e009" xlink:type="simple"/><mml:math display="block" id="M9"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>S</mml:mi> <mml:mi>N</mml:mi> <mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mo>=</mml:mo> <mml:mi>V</mml:mi> <mml:mi>a</mml:mi> <mml:mi>r</mml:mi> <mml:mrow><mml:mo>{</mml:mo> <mml:msub><mml:mi>D</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>}</mml:mo></mml:mrow> <mml:mo>/</mml:mo> <mml:mi>V</mml:mi> <mml:mi>a</mml:mi> <mml:mi>r</mml:mi> <mml:mrow><mml:mo>{</mml:mo> <mml:msub><mml:mi>δ</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>}</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(3)</label></disp-formula></p>
<p>MNF is the set of linear transformation (<italic>Y</italic><sub><italic>MNF</italic></sub>)<sub><italic>i</italic></sub> = <italic>Yϕ</italic><sub><italic>i</italic></sub>, for <italic>i</italic> = 1, …, <italic>S</italic>, such that the SNR for (<italic>Y</italic><sub><italic>MNF</italic></sub>)<sub><italic>i</italic></sub> is maximum among all linear transformations orthogonal to (<italic>Y</italic><sub><italic>MNF</italic></sub>)<sub><italic>j</italic></sub>, for <italic>j</italic> = <italic>i</italic> + 1, …, <italic>S</italic>. All the transformation vectors in MNF space follow <inline-formula id="pone.0205219.e010"><alternatives><graphic id="pone.0205219.e010g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e010" xlink:type="simple"/><mml:math display="inline" id="M10"><mml:mrow><mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>Y</mml:mi></mml:msub> <mml:msub><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi></mml:msub> <mml:mo>=</mml:mo> <mml:mn>1</mml:mn> <mml:mo>,</mml:mo> <mml:mo>∀</mml:mo> <mml:mi>i</mml:mi> <mml:mo>=</mml:mo> <mml:mrow><mml:mo>[</mml:mo> <mml:mn>1</mml:mn> <mml:mo>:</mml:mo> <mml:mi>S</mml:mi> <mml:mo>]</mml:mo></mml:mrow></mml:mrow></mml:math></alternatives></inline-formula>. Maximization of the noise fraction leads to a numbering of bands that gives decreasing image quality with increasing component number. The SNR for (<italic>Y</italic><sub><italic>MNF</italic></sub>)<sub><italic>i</italic></sub> in MNF space can be formulated:
<disp-formula id="pone.0205219.e011"><alternatives><graphic id="pone.0205219.e011g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e011" xlink:type="simple"/><mml:math display="block" id="M11"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mfrac><mml:mrow><mml:mi>V</mml:mi> <mml:mi>a</mml:mi> <mml:mi>r</mml:mi> <mml:mo>{</mml:mo> <mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi>D</mml:mi> <mml:mo>}</mml:mo></mml:mrow> <mml:mrow><mml:mi>V</mml:mi> <mml:mi>a</mml:mi> <mml:mi>r</mml:mi> <mml:mo>{</mml:mo> <mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi>δ</mml:mi> <mml:mo>}</mml:mo></mml:mrow></mml:mfrac> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>D</mml:mi></mml:msub> <mml:msub><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi></mml:msub></mml:mrow> <mml:mrow><mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>δ</mml:mi></mml:msub> <mml:msub><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>Y</mml:mi></mml:msub> <mml:msub><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi></mml:msub></mml:mrow> <mml:mrow><mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>δ</mml:mi></mml:msub> <mml:msub><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac> <mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>=</mml:mo> <mml:msub><mml:mo>λ</mml:mo> <mml:mi>i</mml:mi></mml:msub> <mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(4)</label></disp-formula></p>
<p>The Noise fraction itself can then be re-factored as follows:
<disp-formula id="pone.0205219.e012"><alternatives><graphic id="pone.0205219.e012g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e012" xlink:type="simple"/><mml:math display="block" id="M12"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mfrac><mml:mrow><mml:mi>V</mml:mi> <mml:mi>a</mml:mi> <mml:mi>r</mml:mi> <mml:mo>{</mml:mo> <mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi>δ</mml:mi> <mml:mo>}</mml:mo></mml:mrow> <mml:mrow><mml:mi>V</mml:mi> <mml:mi>a</mml:mi> <mml:mi>r</mml:mi> <mml:mo>{</mml:mo> <mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:mi>Y</mml:mi> <mml:mo>}</mml:mo></mml:mrow></mml:mfrac> <mml:mo>=</mml:mo> <mml:mfrac><mml:mrow><mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>δ</mml:mi></mml:msub> <mml:msub><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi></mml:msub></mml:mrow> <mml:mrow><mml:msubsup><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi> <mml:mi>T</mml:mi></mml:msubsup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>Y</mml:mi></mml:msub> <mml:msub><mml:mi>ϕ</mml:mi> <mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac> <mml:mo>=</mml:mo> <mml:mfrac><mml:mn>1</mml:mn> <mml:msub><mml:mo>λ</mml:mo> <mml:mi>i</mml:mi></mml:msub></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(5)</label></disp-formula></p>
<p>The vectors <italic>ϕ</italic><sub><italic>i</italic></sub> are thus the real, symmetric eigenvectors of the eigenvalue problem:
<disp-formula id="pone.0205219.e013"><alternatives><graphic id="pone.0205219.e013g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e013" xlink:type="simple"/><mml:math display="block" id="M13"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="right"><mml:mrow><mml:mi>d</mml:mi> <mml:mi>e</mml:mi> <mml:mi>t</mml:mi><mml:mo>{</mml:mo> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>Y</mml:mi></mml:msub> <mml:msubsup><mml:mo>Σ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msubsup> <mml:mo>-</mml:mo> <mml:mo>λ</mml:mo> <mml:mi>I</mml:mi> <mml:mo>}</mml:mo> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(6)</label></disp-formula></p>
<p>Hence <italic>ϕ</italic><sub><italic>i</italic></sub> are the eigenvectors of <inline-formula id="pone.0205219.e014"><alternatives><graphic id="pone.0205219.e014g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e014" xlink:type="simple"/><mml:math display="inline" id="M14"><mml:mrow><mml:msub><mml:mo>Σ</mml:mo> <mml:mi>Y</mml:mi></mml:msub> <mml:msubsup><mml:mo>Σ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msubsup></mml:mrow></mml:math></alternatives></inline-formula>, and λ<sub><italic>i</italic></sub>, eigenvalue corresponding to <italic>ϕ</italic><sub><italic>i</italic></sub>, equals to the noise fraction in (<italic>Y</italic><sub><italic>MNF</italic></sub>)<sub><italic>i</italic></sub>. Also, λ<sub>1</sub> ≥ λ<sub>2</sub> ≥ … ≥ λ<sub><italic>S</italic></sub>, so that the components show decreasing image quality. Thus SNR is given by λ<sub><italic>i</italic></sub> − 1.</p>
</sec>
<sec id="sec007">
<title>Geometric interpretation</title>
<p>As the data <italic>D</italic> and noise <italic>δ</italic> are additive and uncorrelated, we can write:
<disp-formula id="pone.0205219.e015"><alternatives><graphic id="pone.0205219.e015g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e015" xlink:type="simple"/><mml:math display="block" id="M15"><mml:mtable columnalign="left"><mml:mtr columnalign="left"><mml:mtd columnalign="left"><mml:mi>Y</mml:mi></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:mi>D</mml:mi><mml:mo>+</mml:mo><mml:mi>δ</mml:mi></mml:mrow></mml:mtd></mml:mtr><mml:mtr columnalign="left"><mml:mtd columnalign="left"><mml:mrow><mml:msub><mml:mo>Σ</mml:mo><mml:mi>Y</mml:mi></mml:msub></mml:mrow></mml:mtd><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo><mml:msub><mml:mo>Σ</mml:mo><mml:mi>D</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mo>Σ</mml:mo><mml:mi>δ</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(7)</label></disp-formula></p>
<p>Let the spectral decomposition of Σ<sub><italic>δ</italic></sub> be Σ<sub><italic>δ</italic></sub> = <italic>E</italic>Λ<sub><italic>δ</italic></sub> <italic>E</italic><sup><italic>T</italic></sup>. Rotating Σ<sub><italic>Y</italic></sub> in <xref ref-type="disp-formula" rid="pone.0205219.e015">Eq 7</xref> with eigenvector matrix <italic>E</italic> and rescaling it using the inverse-square root of the noise singular values Λ<sub><italic>δ</italic></sub>, results in new covariance matrix where the contribution of noise component has been turned into an identity matrix.
<disp-formula id="pone.0205219.e016"><alternatives><graphic id="pone.0205219.e016g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e016" xlink:type="simple"/><mml:math display="block" id="M16"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="left"><mml:msub><mml:mo>Σ</mml:mo> <mml:mi>W</mml:mi></mml:msub></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>T</mml:mi></mml:msup> <mml:msup><mml:mi>E</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>Y</mml:mi></mml:msub> <mml:mi>E</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>T</mml:mi></mml:msup> <mml:msup><mml:mi>E</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>D</mml:mi></mml:msub> <mml:mi>E</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>+</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>T</mml:mi></mml:msup> <mml:msup><mml:mi>E</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>δ</mml:mi></mml:msub> <mml:mi>E</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msub><mml:mo>Σ</mml:mo> <mml:mrow><mml:mi>W</mml:mi> <mml:mo>(</mml:mo> <mml:mi>D</mml:mi> <mml:mo>)</mml:mo></mml:mrow></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>I</mml:mi> <mml:mi>δ</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(8)</label></disp-formula></p>
<p>Let the eigen decomposition of Σ<sub><italic>W</italic></sub> be Σ<sub><italic>W</italic></sub> = <italic>G</italic>Λ<sub><italic>MNF</italic></sub> <italic>G</italic><sup><italic>T</italic></sup>. Rotating Σ<sub><italic>W</italic></sub> in <xref ref-type="disp-formula" rid="pone.0205219.e016">Eq 8</xref> with eigenvector matrix <italic>G</italic> results in:
<disp-formula id="pone.0205219.e017"><alternatives><graphic id="pone.0205219.e017g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e017" xlink:type="simple"/><mml:math display="block" id="M17"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="left"><mml:msub><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>M</mml:mi> <mml:mi>N</mml:mi> <mml:mi>F</mml:mi></mml:mrow></mml:msub></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msup><mml:mi>G</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>W</mml:mi></mml:msub> <mml:mi>G</mml:mi></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msup><mml:mi>G</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:msub><mml:mo>Σ</mml:mo> <mml:mrow><mml:mi>W</mml:mi> <mml:mo>(</mml:mo> <mml:mi>D</mml:mi> <mml:mo>)</mml:mo></mml:mrow></mml:msub> <mml:mi>G</mml:mi> <mml:mo>+</mml:mo> <mml:msup><mml:mi>G</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:msub><mml:mi>I</mml:mi> <mml:mi>δ</mml:mi></mml:msub> <mml:mi>G</mml:mi></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:msub><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>W</mml:mi> <mml:mo>(</mml:mo> <mml:mi>D</mml:mi> <mml:mo>)</mml:mo></mml:mrow></mml:msub> <mml:mo>+</mml:mo> <mml:msub><mml:mi>I</mml:mi> <mml:mi>δ</mml:mi></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives> <label>(9)</label></disp-formula></p>
<p>The series of transforms that we used to change the original data covariance matrix Σ<sub><italic>Y</italic></sub> into Λ<sub><italic>MNF</italic></sub> is given by the transformation vector <inline-formula id="pone.0205219.e018"><alternatives><graphic id="pone.0205219.e018g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e018" xlink:type="simple"/><mml:math display="inline" id="M18"><mml:mrow><mml:mo>Φ</mml:mo> <mml:mo>=</mml:mo> <mml:mi>E</mml:mi> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mi>G</mml:mi></mml:mrow></mml:math></alternatives></inline-formula> which we call the MNF projection vectors and Λ<sub><italic>MNF</italic></sub> estimates of SNR of the data.</p>
</sec>
<sec id="sec008">
<title>Optimizing MNF</title>
<p>Expanding the entire MNF transform, we can infer the following:
<disp-formula id="pone.0205219.e019"><alternatives><graphic id="pone.0205219.e019g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e019" xlink:type="simple"/><mml:math display="block" id="M19"><mml:mtable displaystyle="true"><mml:mtr><mml:mtd columnalign="left"><mml:mi>D</mml:mi></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>*</mml:mo> <mml:mo>Φ</mml:mo> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mo>*</mml:mo> <mml:msup><mml:mo>Φ</mml:mo> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>*</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mo>*</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>*</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mo>*</mml:mo> <mml:msup><mml:mi>G</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msup> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:msup><mml:mi>E</mml:mi> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>*</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mo>*</mml:mo> <mml:msup><mml:mi>G</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:msup><mml:mi>E</mml:mi> <mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>*</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mo>*</mml:mo> <mml:msup><mml:mi>R</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mo>*</mml:mo> <mml:msup><mml:mi>G</mml:mi> <mml:mi>T</mml:mi></mml:msup> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:msup><mml:mi>E</mml:mi> <mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>*</mml:mo> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>*</mml:mo> <mml:msup><mml:mrow><mml:mo>(</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd/><mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>Y</mml:mi> <mml:mo>*</mml:mo> <mml:mover accent="true"><mml:mo>Φ</mml:mo> <mml:mo>^</mml:mo></mml:mover> <mml:mo>*</mml:mo> <mml:msup><mml:mover accent="true"><mml:mo>Φ</mml:mo> <mml:mo>˜</mml:mo></mml:mover> <mml:mi>T</mml:mi></mml:msup></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd columnalign="left"><mml:mrow><mml:mo>⇒</mml:mo> <mml:mover accent="true"><mml:mo>Φ</mml:mo> <mml:mo>^</mml:mo></mml:mover></mml:mrow></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mo>-</mml:mo> <mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mspace width="2.em"/><mml:mo>/</mml:mo> <mml:mo>/</mml:mo> <mml:mtext>forward</mml:mtext><mml:mspace width="4pt"/><mml:mtext>MNF</mml:mtext><mml:mspace width="4pt"/><mml:mtext>transform</mml:mtext></mml:mrow></mml:mtd></mml:mtr> <mml:mtr><mml:mtd columnalign="left"><mml:mrow><mml:mo>⇒</mml:mo> <mml:mover accent="true"><mml:mo>Φ</mml:mo> <mml:mo>˜</mml:mo></mml:mover></mml:mrow></mml:mtd> <mml:mtd columnalign="left"><mml:mrow><mml:mo>=</mml:mo> <mml:mi>E</mml:mi> <mml:mo>*</mml:mo> <mml:msubsup><mml:mo>Λ</mml:mo> <mml:mrow><mml:mi>δ</mml:mi></mml:mrow> <mml:mrow><mml:mn>1</mml:mn> <mml:mo>/</mml:mo> <mml:mn>2</mml:mn></mml:mrow></mml:msubsup> <mml:mo>*</mml:mo> <mml:mi>G</mml:mi> <mml:mo>*</mml:mo> <mml:mi>R</mml:mi> <mml:mspace width="2.em"/><mml:mo>/</mml:mo> <mml:mo>/</mml:mo> <mml:mtext>inverse</mml:mtext><mml:mspace width="4pt"/><mml:mtext>MNF</mml:mtext><mml:mspace width="4pt"/><mml:mtext>transform</mml:mtext></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></alternatives></disp-formula></p>
<p>Since <italic>R</italic> is a block identity matrix <inline-formula id="pone.0205219.e020"><alternatives><graphic id="pone.0205219.e020g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e020" xlink:type="simple"/><mml:math display="inline" id="M20"><mml:mrow><mml:mi>R</mml:mi> <mml:mo>=</mml:mo> <mml:mo>[</mml:mo> <mml:mtable><mml:mtr><mml:mtd><mml:msub><mml:mi>I</mml:mi> <mml:mi>K</mml:mi></mml:msub></mml:mtd> <mml:mtd><mml:mn>0</mml:mn></mml:mtd></mml:mtr> <mml:mtr><mml:mtd><mml:mn>0</mml:mn></mml:mtd> <mml:mtd><mml:mn>0</mml:mn></mml:mtd></mml:mtr></mml:mtable> <mml:mo>]</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>, introducing an extra <italic>R</italic><sup><italic>T</italic></sup> term keeps the value of the expression unaltered as <italic>R</italic> * <italic>R</italic><sup><italic>T</italic></sup> = <italic>R</italic>. Writing the MNF transform in this way, we ensure that we skip the costly matrix inversions of the MNF vectors. Also <italic>G</italic> * <italic>R</italic> is effectively choosing the top <italic>K</italic> eigenvalues of <italic>G</italic>. Therefore we can reduce the computation cost by finding the reduced rank-<italic>K</italic> SVD of Σ<sub><italic>Y</italic></sub>. The Λ<sub><italic>δ</italic></sub> matrix inversion can also be replaced by more efficient versions due to its diagonal structure.</p>
</sec>
<sec id="sec009">
<title>Automatic band selection</title>
<p>The optimal value of <italic>K</italic> can be determined by inspecting the entries of Λ<sub><italic>MNF</italic></sub> = <italic>SNR</italic> + 1 which is a diagonal matrix. The Rose criteria [<xref ref-type="bibr" rid="pone.0205219.ref022">22</xref>] states that an SNR of at least 5.0 is needed to be able to distinguish image features at 100% certainty. We select the top <italic>K</italic> bands in the MNF space for which <italic>SNR</italic> = Λ<sub><italic>MNF</italic></sub> − 1 ≥ 5.0. Automating this process is the main computational speed factor that brings down the processing time from days down to a few hours.</p>
</sec>
<sec id="sec010">
<title>Fast MNF</title>
<p>By exploiting the MNF formulation (<italic>sec</italic>. Optimizing MNF), we can avoid all inverse operations and replace them with transpose, thereby making computations faster. Owing to the symmetric structure of covariance matrices, we also compute the singular value decomposition using eigen decomposition which is faster. Also, the transformation matrices are of size (<italic>S</italic> × <italic>K</italic>) instead of (<italic>S</italic> × <italic>S</italic>) where <italic>K</italic> ≪ <italic>S</italic>. This is the main factor responsible for the algorithmic speedup.</p>
</sec>
<sec id="sec011">
<title>Approx MNF</title>
<p>Since <italic>K</italic> ≪ <italic>S</italic>, it is inefficient to compute the full spectral decomposition of the covariance matrix. Empirically, it was observed over different datasets, that the optimal value of the automatically selected <italic>K</italic> is 2 − 3% of the total number of bands <italic>S</italic>. Hence we compute only a rank <inline-formula id="pone.0205219.e021"><alternatives><graphic id="pone.0205219.e021g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e021" xlink:type="simple"/><mml:math display="inline" id="M21"><mml:mover accent="true"><mml:mi>K</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula> truncated SVD of the whitened covariance matrix. This results in reduced computation time as well as memory. The standard solutions to truncated SVD include the power iteration algorithm and the Krylov subspace methods. Since power iteration is unstable at times due to the structure of the singular values, we use a version of the Block Lanczos method [<xref ref-type="bibr" rid="pone.0205219.ref023">23</xref>]. We set <inline-formula id="pone.0205219.e022"><alternatives><graphic id="pone.0205219.e022g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e022" xlink:type="simple"/><mml:math display="inline" id="M22"><mml:mrow><mml:mover accent="true"><mml:mi>K</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mo>=</mml:mo> <mml:mn>0</mml:mn> <mml:mo>.</mml:mo> <mml:mn>03</mml:mn> <mml:mo>×</mml:mo> <mml:mi>S</mml:mi></mml:mrow></mml:math></alternatives></inline-formula> and compute the rank <inline-formula id="pone.0205219.e023"><alternatives><graphic id="pone.0205219.e023g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e023" xlink:type="simple"/><mml:math display="inline" id="M23"><mml:mover accent="true"><mml:mi>K</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula>-SVD, then let the band selection criteria to decide the optimal <italic>K</italic>.</p>
</sec>
<sec id="sec012">
<title>Rand MNF</title>
<p>Although the block Lanczos algorithm can attain machine precision, it inevitably goes many passes through Σ<sub><italic>W</italic></sub>, and it is thus slow when Σ<sub><italic>W</italic></sub> is large or does not fit in memory. To circumvent this scenario, we use a faster randomized and memory efficient version which computes the <inline-formula id="pone.0205219.e024"><alternatives><graphic id="pone.0205219.e024g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e024" xlink:type="simple"/><mml:math display="inline" id="M24"><mml:mover accent="true"><mml:mi>K</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula>-SVD of Σ<sub><italic>W</italic></sub> up to 1+ <italic>ϵ</italic> Frobenius norm relative error [<xref ref-type="bibr" rid="pone.0205219.ref024">24</xref>].</p>
</sec>
<sec id="sec013">
<title>Error metric</title>
<p>In the absence of ground truth images of denoised data, we use a non-reference image quality metric this is simple and easy to use. The Method Noise Image (MNI) [<xref ref-type="bibr" rid="pone.0205219.ref025">25</xref>] metric aims at maximizing the structure similarity between the input noisy image and the estimated image noise around homogeneous regions and the structure similarity between the input noisy image and the denoised image around highly-structured regions, and is computed as the linear correlation coefficient of the two corresponding structure similarity maps.</p>
</sec>
</sec>
<sec id="sec014" sec-type="results">
<title>Results</title>
<sec id="sec015">
<title>Setup</title>
<p>For all the experimentation, a standalone machine with Intel Xeon <italic>E</italic>5 − 1660@3.20GHz CPU and 64GB of RAM was used. Software for the simulations, results and plots include Matlab and ENVI.</p>
</sec>
<sec id="sec016">
<title>Complexity analysis</title>
<p>
<xref ref-type="table" rid="pone.0205219.t001">Table 1</xref> shows the algorithmic time and space complexity in terms of memory usage for the different MNF versions. The best algorithm in terms of time-space-accuracy is Approx MNF. This is because it computes the best rank-K SVD with little loss in its approximation or memory usage. Depending on how much one wants a memory-accuracy trade-off, one may choose to switch to use Rand MNF, as it is a randomized version with approximation error guided by its parameters. For a typical FTIR spectrum with <italic>S</italic> ∼ 1500 bands, the algorithm estimated the optimal number of bands to be <italic>K</italic> ∼ 30, resulting in an efficiency factor of 50×.</p>
<table-wrap id="pone.0205219.t001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0205219.t001</object-id>
<label>Table 1</label>
<caption>
<title>Comparison of time and space complexity of MNF versions.</title>
<p>
<inline-formula id="pone.0205219.e025">
<alternatives>
<graphic id="pone.0205219.e025g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e025" xlink:type="simple"/>
<mml:math display="inline" id="M25">
<mml:mi mathvariant="script">O</mml:mi>
</mml:math>
</alternatives>
</inline-formula>: big-O complexity. <italic>nnz</italic>(<italic>X</italic>): # non-zero elements in <italic>X</italic>. <italic>N</italic>: # pixels, <italic>S</italic>: # spectral bands and <italic>K</italic>: # chosen bands.</p>
</caption>
<alternatives>
<graphic id="pone.0205219.t001g" mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0205219.t001" xlink:type="simple"/>
<table border="0" frame="box" rules="all">
<colgroup>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
<col align="left" valign="middle"/>
</colgroup>
<thead>
<tr>
<th align="left" style="border-bottom:thick">Algorithm</th>
<th align="right" style="border-bottom:thick">Time</th>
<th align="right" style="border-bottom:thick">Space</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left">1. MNF</td>
<td align="right">
<inline-formula id="pone.0205219.e026">
<alternatives>
<graphic id="pone.0205219.e026g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e026" xlink:type="simple"/>
<mml:math display="inline" id="M26">
<mml:mrow>
<mml:mi mathvariant="script">O</mml:mi>
<mml:mo>(</mml:mo>
<mml:msup>
<mml:mi>S</mml:mi>
<mml:mn>3</mml:mn>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>N</mml:mi>
<mml:msup>
<mml:mi>S</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</alternatives>
</inline-formula>
</td>
<td align="right">
<inline-formula id="pone.0205219.e027">
<alternatives>
<graphic id="pone.0205219.e027g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e027" xlink:type="simple"/>
<mml:math display="inline" id="M27">
<mml:mrow>
<mml:mi mathvariant="script">O</mml:mi>
<mml:mo>(</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>S</mml:mi>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:mi>S</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</alternatives>
</inline-formula>
</td>
</tr>
<tr>
<td align="left">2. Fast MNF</td>
<td align="right">
<inline-formula id="pone.0205219.e028">
<alternatives>
<graphic id="pone.0205219.e028g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e028" xlink:type="simple"/>
<mml:math display="inline" id="M28">
<mml:mrow>
<mml:mi mathvariant="script">O</mml:mi>
<mml:mo>(</mml:mo>
<mml:msup>
<mml:mi>S</mml:mi>
<mml:mn>3</mml:mn>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>K</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</alternatives>
</inline-formula>
</td>
<td align="right">
<inline-formula id="pone.0205219.e029">
<alternatives>
<graphic id="pone.0205219.e029g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e029" xlink:type="simple"/>
<mml:math display="inline" id="M29">
<mml:mrow>
<mml:mi mathvariant="script">O</mml:mi>
<mml:mo>(</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>K</mml:mi>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:mi>S</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</alternatives>
</inline-formula>
</td>
</tr>
<tr>
<td align="left">3. Approx MNF</td>
<td align="right">
<inline-formula id="pone.0205219.e030">
<alternatives>
<graphic id="pone.0205219.e030g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e030" xlink:type="simple"/>
<mml:math display="inline" id="M30">
<mml:mrow>
<mml:mi mathvariant="script">O</mml:mi>
<mml:mo>(</mml:mo>
<mml:msup>
<mml:mi>S</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mi>K</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>K</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</alternatives>
</inline-formula>
</td>
<td align="right">
<inline-formula id="pone.0205219.e031">
<alternatives>
<graphic id="pone.0205219.e031g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e031" xlink:type="simple"/>
<mml:math display="inline" id="M31">
<mml:mrow>
<mml:mi mathvariant="script">O</mml:mi>
<mml:mo>(</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>K</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>K</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</alternatives>
</inline-formula>
</td>
</tr>
<tr>
<td align="left">4. Rand MNF</td>
<td align="right">
<inline-formula id="pone.0205219.e032">
<alternatives>
<graphic id="pone.0205219.e032g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e032" xlink:type="simple"/>
<mml:math display="inline" id="M32">
<mml:mrow>
<mml:mi mathvariant="script">O</mml:mi>
<mml:mo>(</mml:mo>
<mml:mi>n</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>z</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mo>Σ</mml:mo>
<mml:mi>W</mml:mi>
</mml:msub>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mi>K</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>K</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</alternatives>
</inline-formula>
</td>
<td align="right">
<inline-formula id="pone.0205219.e033">
<alternatives>
<graphic id="pone.0205219.e033g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e033" xlink:type="simple"/>
<mml:math display="inline" id="M33">
<mml:mrow>
<mml:mi mathvariant="script">O</mml:mi>
<mml:mo>(</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>K</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>K</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:math>
</alternatives>
</inline-formula>
</td>
</tr>
</tbody>
</table>
</alternatives>
</table-wrap>
</sec>
<sec id="sec017">
<title>Timing analysis</title>
<p>Standard MNF is worst in terms of time complexity as it computes the full eigen decomposition of Σ<sub><italic>W</italic></sub> <inline-formula id="pone.0205219.e034"><alternatives><graphic id="pone.0205219.e034g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e034" xlink:type="simple"/><mml:math display="inline" id="M34"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mi>S</mml:mi> <mml:mn>3</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> and uses all the <italic>S</italic> eigenvectors to transform the input data into MNF space <inline-formula id="pone.0205219.e035"><alternatives><graphic id="pone.0205219.e035g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e035" xlink:type="simple"/><mml:math display="inline" id="M35"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>N</mml:mi> <mml:msup><mml:mi>S</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. In comparison, Fast MNF still computes the full decomposition of Σ<sub><italic>W</italic></sub> <inline-formula id="pone.0205219.e036"><alternatives><graphic id="pone.0205219.e036g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e036" xlink:type="simple"/><mml:math display="inline" id="M36"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mi>S</mml:mi> <mml:mn>3</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>, but uses the Band selection criteria to retain only the top <italic>K</italic> eigenvalues. Hence only the top <italic>K</italic> eigenvectors are used to transform the data into MNF space <inline-formula id="pone.0205219.e037"><alternatives><graphic id="pone.0205219.e037g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e037" xlink:type="simple"/><mml:math display="inline" id="M37"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mo>(</mml:mo> <mml:mi>N</mml:mi> <mml:mi>S</mml:mi> <mml:mi>K</mml:mi> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. For Approx MNF, we only compute a truncated rank <inline-formula id="pone.0205219.e038"><alternatives><graphic id="pone.0205219.e038g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e038" xlink:type="simple"/><mml:math display="inline" id="M38"><mml:mover accent="true"><mml:mi>K</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula>-SVD of Σ<sub><italic>W</italic></sub>, since it was empirically observed that the top <italic>K</italic> chosen bands lie within <inline-formula id="pone.0205219.e039"><alternatives><graphic id="pone.0205219.e039g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e039" xlink:type="simple"/><mml:math display="inline" id="M39"><mml:mrow><mml:mover accent="true"><mml:mi>K</mml:mi> <mml:mo>^</mml:mo></mml:mover> <mml:mo>=</mml:mo> <mml:mn>2</mml:mn> <mml:mo>-</mml:mo> <mml:mn>3</mml:mn> <mml:mo>%</mml:mo></mml:mrow></mml:math></alternatives></inline-formula> of <italic>S</italic>, thereby highly reducing the computational cost <inline-formula id="pone.0205219.e040"><alternatives><graphic id="pone.0205219.e040g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e040" xlink:type="simple"/><mml:math display="inline" id="M40"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mi>S</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mi>K</mml:mi> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. Again, only the top <italic>K</italic> eigenvectors are used to transform the data into MNF space <inline-formula id="pone.0205219.e041"><alternatives><graphic id="pone.0205219.e041g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e041" xlink:type="simple"/><mml:math display="inline" id="M41"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mo>(</mml:mo> <mml:mi>N</mml:mi> <mml:mi>S</mml:mi> <mml:mi>K</mml:mi> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. Rand MNF uses a randomized algorithm to compute a truncated rank <inline-formula id="pone.0205219.e042"><alternatives><graphic id="pone.0205219.e042g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e042" xlink:type="simple"/><mml:math display="inline" id="M42"><mml:mover accent="true"><mml:mi>K</mml:mi> <mml:mo>^</mml:mo></mml:mover></mml:math></alternatives></inline-formula>-SVD of Σ<sub><italic>W</italic></sub>, hence it is much more efficient in terms of speed <inline-formula id="pone.0205219.e043"><alternatives><graphic id="pone.0205219.e043g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e043" xlink:type="simple"/><mml:math display="inline" id="M43"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:mi>n</mml:mi> <mml:mi>n</mml:mi> <mml:mi>z</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msub><mml:mo>Σ</mml:mo> <mml:mi>W</mml:mi></mml:msub> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow> <mml:mi>K</mml:mi> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>, as the values in Σ<sub><italic>W</italic></sub> will only be non-zero for channels which are correlated in terms of signal. Only the top <italic>K</italic> eigenvectors are used to transform the data into MNF space <inline-formula id="pone.0205219.e044"><alternatives><graphic id="pone.0205219.e044g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e044" xlink:type="simple"/><mml:math display="inline" id="M44"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mo>(</mml:mo> <mml:mi>N</mml:mi> <mml:mi>S</mml:mi> <mml:mi>K</mml:mi> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. Refer to <xref ref-type="fig" rid="pone.0205219.g001">Fig 1</xref> for runtime. In all the three variants with <italic>S</italic> ∼ 1500 and <italic>K</italic> ∼ 30, the algorithmic scaling of <italic>SK</italic> instead of <italic>S</italic><sup>2</sup> reduces runtime by ∼ 50×. For the BR1003 data, the entire MNF denoising process was reduced from ∼ 1 month to ∼ 2 hours. This clearly shows that the larger the data size, the better is the scaling of the proposed algorithms, thereby massively reducing the computational time of denoising for large TMA and associated datasets.</p>
<fig id="pone.0205219.g001" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0205219.g001</object-id>
<label>Fig 1</label>
<caption>
<title>Runtime comparison of different implementations of MNF.</title>
<p>The figure illustrates how time scales with varying size of the input data for proposed versions and optimizations of the standard MNF. The size is varied from 10<italic>K</italic> pixels (100 × 100) to 1000<italic>K</italic> pixels (1000 × 1000). Compared to the standard MNF, all the other versions have a speedup factor of ∼ 10. This speedup is obtained by utilizing the fact that we do not need all the forward MNF vectors, but only the top <italic>K</italic> ones that are digitally calculated, avoiding manual selection. Also, a set of optimized matrix operations have been implemented, for instance replacing all inverse operations with transpose for improved computational performance. Due to BLAS optimized modules in Matlab, matrix multiplications are efficiently distributed across the cores automatically. Note: The standard MNF runtime includes automatic band selection.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0205219.g001" xlink:type="simple"/>
</fig>
<p><bold>Note:</bold> Since the structure of the noise is unknown, we cannot instinctively perform the rank-<italic>K</italic> approximation of Σ<sub><italic>δ</italic></sub>, because depending on experiment and instrument there is no guarantee on the strength of noise present in the raw data. For this reason, in the first step of eigen decomposition, we choose to retain bands which accounts for 99% variance in the noise bands. This further reduces the computational time of the process (∼ 3× extra speedup).</p>
</sec>
<sec id="sec018">
<title>Space analysis</title>
<p>Standard MNF computes the full SVD decomposition <inline-formula id="pone.0205219.e045"><alternatives><graphic id="pone.0205219.e045g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e045" xlink:type="simple"/><mml:math display="inline" id="M45"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mi>S</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. The transformed data in MNF space contains all <italic>S</italic> bands <inline-formula id="pone.0205219.e046"><alternatives><graphic id="pone.0205219.e046g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e046" xlink:type="simple"/><mml:math display="inline" id="M46"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mo>(</mml:mo> <mml:mi>N</mml:mi> <mml:mi>S</mml:mi> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. Fast MNF again does the full SVD decomposition <inline-formula id="pone.0205219.e047"><alternatives><graphic id="pone.0205219.e047g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e047" xlink:type="simple"/><mml:math display="inline" id="M47"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mrow><mml:mo>(</mml:mo> <mml:msup><mml:mi>S</mml:mi> <mml:mn>2</mml:mn></mml:msup> <mml:mo>)</mml:mo></mml:mrow> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. However the data in transformed domain only contain <italic>K</italic> bands <inline-formula id="pone.0205219.e048"><alternatives><graphic id="pone.0205219.e048g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e048" xlink:type="simple"/><mml:math display="inline" id="M48"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mo>(</mml:mo> <mml:mi>N</mml:mi> <mml:mi>K</mml:mi> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. Both Approx MNF and Rand MNF compute the truncated rank <italic>K</italic> decomposition, hence there are <italic>K</italic> eigenvectors each of <italic>S</italic> dimension <inline-formula id="pone.0205219.e049"><alternatives><graphic id="pone.0205219.e049g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e049" xlink:type="simple"/><mml:math display="inline" id="M49"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mo>(</mml:mo> <mml:mi>S</mml:mi> <mml:mi>K</mml:mi> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. The data in the transformed domain contains only <italic>K</italic> bands <inline-formula id="pone.0205219.e050"><alternatives><graphic id="pone.0205219.e050g" mimetype="image" position="anchor" xlink:href="info:doi/10.1371/journal.pone.0205219.e050" xlink:type="simple"/><mml:math display="inline" id="M50"><mml:mrow><mml:mo>(</mml:mo> <mml:mi mathvariant="script">O</mml:mi> <mml:mo>(</mml:mo> <mml:mi>N</mml:mi> <mml:mi>K</mml:mi> <mml:mo>)</mml:mo> <mml:mo>)</mml:mo></mml:mrow></mml:math></alternatives></inline-formula>. For the FTIR data with <italic>S</italic> ∼ 1500 bands and <italic>K</italic> ∼ 30, we achieve a RAM space saving of ∼ 50×, allowing us to process more data simultaneously in one go.</p>
</sec>
<sec id="sec019">
<title>Denoising profiles</title>
<p>The improvements offered by the different versions of the MNF presented in this study are illustrated in <xref ref-type="fig" rid="pone.0205219.g002">Fig 2</xref>. The extent of denoising both in the spectral and spatial domain is approximately the same for all the different MNF algorithms. <xref ref-type="fig" rid="pone.0205219.g002">Fig 2A</xref>. depicts the spatial detail offered by different MNF versions with zoomed in sections in <xref ref-type="fig" rid="pone.0205219.g002">Fig 2C and 2B</xref>. shows the horizontal signal profile across the sample. Next, spectral profiles are compared across the different algorithms with reference spectrum (without MNF) to illustrate the extent of noise removal in each case (<xref ref-type="fig" rid="pone.0205219.g002">Fig 2D</xref>). It can be seen that even with a speed up factor of ∼ 10 there is no significant reduction in the spectral and spatial image quality.</p>
<fig id="pone.0205219.g002" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0205219.g002</object-id>
<label>Fig 2</label>
<caption>
<title/>
<p>Spectral and SNR comparisons: A. IR image of a patient case at amide 1 band. B: Intensity profile along the horizontal line in the cases shown in A spanning the entire core for both the noisy and the denoised (in gray) version. C. Zoomed in view of the area marked with a red box in top row. D. Comparison of the spectral profile of the noisy and the MNF version at the pixel marked in red in C.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0205219.g002" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec020">
<title>Error metric</title>
<p>Along with evaluating the performance of the presented MNF versions by examining the tissue profile, we utilize the MNI (method noise image) metric [<xref ref-type="bibr" rid="pone.0205219.ref025">25</xref>] aiming to maximize the structural similarity between the input noisy image and the denoised image around highly-structured regions, in the absence of ground truth. <xref ref-type="fig" rid="pone.0205219.g003">Fig 3</xref> shows the metric values for a core, over all the 1506 bands. A lower value of MNI indicate better denoising and structure preservation. This is evident from the fingerprint region (900 − 1800<italic>cm</italic><sup>−1</sup>) which has very low values of MNI, while it is higher for the IR silent region (1800 − 2700<italic>cm</italic><sup>−1</sup>). Since Standard MNF, Fast MNF and Approx MNF are almost the same in terms of reconstruction accuracy, all the plots from those three methods are same. The Rand MNF method which has a space-accuracy trade-off, produces similar results but with slight variations in most bands (notice the wavering in the plot).</p>
<fig id="pone.0205219.g003" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0205219.g003</object-id>
<label>Fig 3</label>
<caption>
<title>MNI metric plot for a breast tissue biopsy.</title>
<p>Lower values of MNI indicate better denoising and perseverance of structure. Across all the four variations we notice low values of MNI in the fingerprint region (900 − 1800<italic>cm</italic><sup>−1</sup>), which is mainly responsible for tissue classification. This shows that even in the presence of noise, the subtle structural features of the tissues are preserved after denoising. High MNI values in the IR silent region (1800 − 2700<italic>cm</italic><sup>−1</sup>) are expected as they mainly contain noise and no relevant signal components. The functional region (2700 − 3600<italic>cm</italic><sup>−1</sup>) has low MNI again followed by high MNI values in the water vapor absorption bands (3600 − 3800<italic>cm</italic><sup>−1</sup>).</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0205219.g003" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec021">
<title>Visualizing MNF bands</title>
<p>
<xref ref-type="fig" rid="pone.0205219.g004">Fig 4</xref> visualizes the top <italic>K</italic> eigenimages (where <italic>K</italic> is automatically determined by the selection criteria) for two different patient cases (core1 and core 2). The bands in MNF space are arranged in decreasing order of SNR (increasing order of noise fraction), resulting in decreasing image quality with increase in band number. This suggests that the eigenimages in MNF space have decreasing image quality in terms of both the noise and structural detail. So, a few top bands in the MNF space should be able to capture most of information represented in the data along with denoising. This concept can further be utilized to develop automated selection criteria for the number of bands to be kept after the transform. This can help eliminate user based subjectivity, make the process faster and easier to implement.</p>
<fig id="pone.0205219.g004" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0205219.g004</object-id>
<label>Fig 4</label>
<caption>
<title>Eigenimages of the top K bands in the MNF space for two given TMA cores.</title>
<p>There is an evident decrease in structural features and SNR with increase in band number. Manually inspecting these eigenimages or defining some measurement metric (Reddy <italic>et al</italic>. [<xref ref-type="bibr" rid="pone.0205219.ref020">20</xref>]) on them, increases the processing time and computation cost for MNF. Our approach automatically determines the optimal value of <italic>K</italic> from the MNF eigenvalues in a computationally efficient manner.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0205219.g004" xlink:type="simple"/>
</fig>
</sec>
<sec id="sec022">
<title>Impact on tissue classification</title>
<p>Furthermore, we studied the effect of MNF based data processing on tissue classification models. In particular we have investigated the performance of different MNF algorithms against raw data for distinguishing cancer from benign breast cells. It can be seen in <xref ref-type="fig" rid="pone.0205219.g005">Fig 5</xref>, that for all the MNF versions, the Area Under Curve (AUC) value of the malignant epithelium (cancer) class is the same and there is a 10% drop in accuracy without the use of MNF. This suggests that for the development of highly accurate and efficient diagnostic models with HSI data, MNF gives better performance. Also, the MNF techniques presented in this paper (Fast MNF, Rand MNF and Approx MNF), offers the same performance as compared to standard MNF with a factor of 60× reduction in the processing time and 50× reduction in memory space required for computation.</p>
<fig id="pone.0205219.g005" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0205219.g005</object-id>
<label>Fig 5</label>
<caption>
<title>Effect of MNF variants on the classification accuracy of a breast tissue biopsy.</title>
<p>A-D. Classified images after standard MNF, fast MNF, Approx MNF and Rand MNF in a clockwise order. E. H&amp;E (Hematoxylin and Eosin) stained image of an adjacent slice of the same tissue. F. Receiver Operating Characteristic (ROC) curve with area under the curve (AUC) values for the malignant epithelium class.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0205219.g005" xlink:type="simple"/>
</fig>
<p>The case shown in <xref ref-type="fig" rid="pone.0205219.g005">Fig 5</xref> belongs to a typical hyperplasia disease state that is known to be correlated with malignant signature but the extent is not well understood. This leads to slight variations in the projections as the some cells may be at the interface of benign and malignant classes. Further to illustrate that the projections are mainly different because of borderline pixels, projections of a benign case is also shown in <xref ref-type="fig" rid="pone.0205219.g006">Fig 6</xref> where the epithelial assignments are similar for all the MNF approximations except at the edges.</p>
<fig id="pone.0205219.g006" position="float">
<object-id pub-id-type="doi">10.1371/journal.pone.0205219.g006</object-id>
<label>Fig 6</label>
<caption>
<title>Effect of MNF variants on the classification accuracy of a benign case of breast tissue biopsy.</title>
<p>A-D. Classified images after standard MNF, fast MNF, Approx MNF and Rand MNF in a clockwise order.</p>
</caption>
<graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0205219.g006" xlink:type="simple"/>
</fig>
</sec>
</sec>
<sec id="sec023" sec-type="conclusions">
<title>Conclusion</title>
<p>In this paper, we demonstrate how to automate the band selection process in the MNF space, which drastically reduces the workflow duration of MNF denoising of TMA’s from almost a month down to a matter of hours. We introduced three different optimizations of the MNF algorithm depending on the speed-memory-accuracy trade-off, resulting in a 60× runtime improvement and 50× memory efficiency. A well established error metric is also used which helps us decide the quality of denoising, in the absence of ground truth images. Similar classification performance of the suggested approaches as compared to conventional techniques suggesting the potential of the developed methods for computationally efficient analysis of big datasets for diagnostic applications. As a future work, we would like to make better approximations of the noise model itself, so that we can apply approximations for the eigen decomposition of the noise covariance matrix, hence further reducing the computational time of the process.</p>
</sec>
<sec id="sec024">
<title>Supporting information</title>
<supplementary-material id="pone.0205219.s001" mimetype="application/zip" position="float" xlink:href="info:doi/10.1371/journal.pone.0205219.s001" xlink:type="simple">
<label>S1 Dataset</label>
<caption>
<title>A small set of the data (S13_noisy.mat) we used for our experiments has been uploaded as a supplementary file.</title>
<p>Also in the supplementary files please find all our matlab code files (S_1_file-S_12_file) (.m).</p>
<p>(ZIP)</p>
</caption>
</supplementary-material>
</sec>
</body>
<back>
<ack>
<p>This research was supported in part by NIH grant R01GM117594.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="pone.0205219.ref001">
<label>1</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Green</surname> <given-names>AA</given-names></name>, <name name-style="western"><surname>Berman</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Switzer</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Craig</surname> <given-names>MD</given-names></name>. <article-title>A transformation for ordering multispectral data in terms of image quality with implications for noise removal</article-title>. <source>Geoscience and Remote Sensing, IEEE Transactions on</source>. <year>1988</year>;<volume>26</volume>(<issue>1</issue>):<fpage>65</fpage>–<lpage>74</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/36.3001" xlink:type="simple">10.1109/36.3001</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0205219.ref002">
<label>2</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bhargava</surname> <given-names>R</given-names></name>. <article-title>Infrared spectroscopic imaging: the next generation</article-title>. <source>Applied spectroscopy</source>. <year>2012</year>;<volume>66</volume>(<issue>10</issue>):<fpage>1091</fpage>–<lpage>1120</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1366/12-06801" xlink:type="simple">10.1366/12-06801</ext-link></comment> <object-id pub-id-type="pmid">23031693</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref003">
<label>3</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Elkins</surname> <given-names>KM</given-names></name>. <article-title>Rapid Presumptive “Fingerprinting” of Body Fluids and Materials by ATR FT-IR Spectroscopy</article-title>. <source>Journal of forensic sciences</source>. <year>2011</year>;<volume>56</volume>(<issue>6</issue>):<fpage>1580</fpage>–<lpage>1587</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/j.1556-4029.2011.01870.x" xlink:type="simple">10.1111/j.1556-4029.2011.01870.x</ext-link></comment> <object-id pub-id-type="pmid">21827466</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref004">
<label>4</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Diem</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Mazur</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Lenau</surname> <given-names>K</given-names></name>, <name name-style="western"><surname>Schubert</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Bird</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Miljković</surname> <given-names>M</given-names></name>, <etal>et al</etal>. <article-title>Molecular pathology via IR and Raman spectral imaging</article-title>. <source>Journal of biophotonics</source>. <year>2013</year>;<volume>6</volume>(<issue>11-12</issue>):<fpage>855</fpage>–<lpage>886</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/jbio.201300131" xlink:type="simple">10.1002/jbio.201300131</ext-link></comment> <object-id pub-id-type="pmid">24311233</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref005">
<label>8</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Görtler</surname> <given-names>J.</given-names></name>, <name name-style="western"><surname>Kayser</surname> <given-names>K.</given-names></name>, <name name-style="western"><surname>Borkenfeld</surname> <given-names>S.</given-names></name>, <name name-style="western"><surname>Carvalho</surname> <given-names>R.</given-names></name>, <name name-style="western"><surname>Kayser</surname> <given-names>G</given-names></name>. <article-title>Congnitive Algorithms and digitized Tissue-based Diagnosis</article-title>. <source>Diagnostic Pathology</source>. <year>2017</year>;<volume>3</volume>:<fpage>248</fpage>.</mixed-citation>
</ref>
<ref id="pone.0205219.ref006">
<label>5</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Mayerich</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Walsh</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Schulmerich</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Bhargava</surname> <given-names>R</given-names></name>. <article-title>Real-time interactive data mining for chemical imaging information: application to automated histopathology</article-title>. <source>BMC bioinformatics</source>. <year>2013</year>;<volume>14</volume>(<issue>1</issue>):<fpage>156</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/1471-2105-14-156" xlink:type="simple">10.1186/1471-2105-14-156</ext-link></comment> <object-id pub-id-type="pmid">23651487</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref007">
<label>6</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Pilling</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Gardner</surname> <given-names>P</given-names></name>. <article-title>Fundamental developments in infrared spectroscopic imaging for biomedical applications</article-title>. <source>Chemical Society reviews</source>. <year>2016</year>;<volume>45</volume>(<issue>7</issue>):<fpage>1935</fpage>–<lpage>1957</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1039/c5cs00846h" xlink:type="simple">10.1039/c5cs00846h</ext-link></comment> <object-id pub-id-type="pmid">26996636</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref008">
<label>7</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lasch</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Diem</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Hänsch</surname> <given-names>W</given-names></name>, <name name-style="western"><surname>Naumann</surname> <given-names>D</given-names></name>. <article-title>Artificial neural networks as supervised techniques for FT-IR microspectroscopic imaging</article-title>. <source>Journal of chemometrics</source>. <year>2006</year>;<volume>20</volume>(<issue>5</issue>):<fpage>209</fpage>–<lpage>220</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/cem.993" xlink:type="simple">10.1002/cem.993</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0205219.ref009">
<label>9</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fernandez</surname> <given-names>DC</given-names></name>, <name name-style="western"><surname>Bhargava</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Hewitt</surname> <given-names>SM</given-names></name>, <name name-style="western"><surname>Levin</surname> <given-names>IW</given-names></name>. <article-title>Infrared spectroscopic imaging for histopathologic recognition</article-title>. <source>Nature biotechnology</source>. <year>2005</year>;<volume>23</volume>(<issue>4</issue>):<fpage>469</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/nbt1080" xlink:type="simple">10.1038/nbt1080</ext-link></comment> <object-id pub-id-type="pmid">15793574</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref010">
<label>10</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Krafft</surname> <given-names>C</given-names></name>, <name name-style="western"><surname>Shapoval</surname> <given-names>L</given-names></name>, <name name-style="western"><surname>Sobottka</surname> <given-names>SB</given-names></name>, <name name-style="western"><surname>Geiger</surname> <given-names>KD</given-names></name>, <name name-style="western"><surname>Schackert</surname> <given-names>G</given-names></name>, <name name-style="western"><surname>Salzer</surname> <given-names>R</given-names></name>. <article-title>Identification of primary tumors of brain metastases by SIMCA classification of IR spectroscopic images</article-title>. <source>Biochimica et Biophysica Acta (BBA)-Biomembranes</source>. <year>2006</year>;<volume>1758</volume>(<issue>7</issue>):<fpage>883</fpage>–<lpage>891</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.bbamem.2006.05.001" xlink:type="simple">10.1016/j.bbamem.2006.05.001</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0205219.ref011">
<label>11</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bassan</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Sachdeva</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Shanks</surname> <given-names>JH</given-names></name>, <name name-style="western"><surname>Brown</surname> <given-names>MD</given-names></name>, <name name-style="western"><surname>Clarke</surname> <given-names>NW</given-names></name>, <name name-style="western"><surname>Gardner</surname> <given-names>P</given-names></name>. <article-title>Automated high-throughput assessment of prostate biopsy tissue using infrared spectroscopic chemical imaging</article-title>. In: <source>Proc SPIE</source>. <volume>vol. 9041</volume>; <year>2014</year>. p. <fpage>90410D</fpage>–<lpage>90416D</lpage>.</mixed-citation>
</ref>
<ref id="pone.0205219.ref012">
<label>12</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Fabian</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Thi</surname> <given-names>NAN</given-names></name>, <name name-style="western"><surname>Eiden</surname> <given-names>M</given-names></name>, <name name-style="western"><surname>Lasch</surname> <given-names>P</given-names></name>, <name name-style="western"><surname>Schmitt</surname> <given-names>J</given-names></name>, <name name-style="western"><surname>Naumann</surname> <given-names>D</given-names></name>. <article-title>Diagnosing benign and malignant lesions in breast tissue sections by using IR-microspectroscopy</article-title>. <source>Biochimica et Biophysica Acta (BBA)-Biomembranes</source>. <year>2006</year>;<volume>1758</volume>(<issue>7</issue>):<fpage>874</fpage>–<lpage>882</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.bbamem.2006.05.015" xlink:type="simple">10.1016/j.bbamem.2006.05.015</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0205219.ref013">
<label>13</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Bhargava</surname> <given-names>R</given-names></name>. <article-title>Towards a practical Fourier transform infrared chemical imaging protocol for cancer histopathology</article-title>. <source>Analytical and bioanalytical chemistry</source>. <year>2007</year>;<volume>389</volume>(<issue>4</issue>):<fpage>1155</fpage>–<lpage>1169</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s00216-007-1511-9" xlink:type="simple">10.1007/s00216-007-1511-9</ext-link></comment> <object-id pub-id-type="pmid">17786414</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref014">
<label>14</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Pounder</surname> <given-names>FN</given-names></name>, <name name-style="western"><surname>Reddy</surname> <given-names>RK</given-names></name>, <name name-style="western"><surname>Bhargava</surname> <given-names>R</given-names></name>. <article-title>Development of a practical spatial-spectral analysis protocol for breast histopathology using Fourier transform infrared spectroscopic imaging</article-title>. <source>Faraday discussions</source>. <year>2016</year>;<volume>187</volume>:<fpage>43</fpage>–<lpage>68</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1039/c5fd00199d" xlink:type="simple">10.1039/c5fd00199d</ext-link></comment> <object-id pub-id-type="pmid">27095431</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref015">
<label>15</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Leslie</surname> <given-names>LS</given-names></name>, <name name-style="western"><surname>Wrobel</surname> <given-names>TP</given-names></name>, <name name-style="western"><surname>Mayerich</surname> <given-names>D</given-names></name>, <name name-style="western"><surname>Bindra</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Emmadi</surname> <given-names>R</given-names></name>, <name name-style="western"><surname>Bhargava</surname> <given-names>R</given-names></name>. <article-title>High definition infrared spectroscopic imaging for lymph node histopathology</article-title>. <source>PloS one</source>. <year>2015</year>;<volume>10</volume>(<issue>6</issue>):<fpage>e0127238</fpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1371/journal.pone.0127238" xlink:type="simple">10.1371/journal.pone.0127238</ext-link></comment> <object-id pub-id-type="pmid">26039216</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref016">
<label>16</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Reddy</surname> <given-names>RK</given-names></name>, <name name-style="western"><surname>Walsh</surname> <given-names>MJ</given-names></name>, <name name-style="western"><surname>Schulmerich</surname> <given-names>MV</given-names></name>, <name name-style="western"><surname>Carney</surname> <given-names>PS</given-names></name>, <name name-style="western"><surname>Bhargava</surname> <given-names>R</given-names></name>. <article-title>High-definition infrared spectroscopic imaging</article-title>. <source>Applied spectroscopy</source>. <year>2013</year>;<volume>67</volume>(<issue>1</issue>):<fpage>93</fpage>–<lpage>105</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1366/11-06568" xlink:type="simple">10.1366/11-06568</ext-link></comment> <object-id pub-id-type="pmid">23317676</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref017">
<label>17</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Sreedhar</surname> <given-names>H</given-names></name>, <name name-style="western"><surname>Varma</surname> <given-names>VK</given-names></name>, <name name-style="western"><surname>Nguyen</surname> <given-names>PL</given-names></name>, <name name-style="western"><surname>Davidson</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Akkina</surname> <given-names>S</given-names></name>, <name name-style="western"><surname>Guzman</surname> <given-names>G</given-names></name>, <etal>et al</etal>. <article-title>High-definition Fourier transform infrared (FT-IR) spectroscopic imaging of human tissue sections towards improving pathology</article-title>. <source>Journal of visualized experiments: JoVE</source>. <year>2015</year>;(<issue>95</issue>). <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3791/52332" xlink:type="simple">10.3791/52332</ext-link></comment> <object-id pub-id-type="pmid">25650759</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref018">
<label>18</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Pilling</surname> <given-names>MJ</given-names></name>, <name name-style="western"><surname>Henderson</surname> <given-names>A</given-names></name>, <name name-style="western"><surname>Bird</surname> <given-names>B</given-names></name>, <name name-style="western"><surname>Brown</surname> <given-names>MD</given-names></name>, <name name-style="western"><surname>Clarke</surname> <given-names>NW</given-names></name>, <name name-style="western"><surname>Gardner</surname> <given-names>P</given-names></name>. <article-title>High-throughput quantum cascade laser (QCL) spectral histopathology: a practical approach towards clinical translation</article-title>. <source>Faraday discussions</source>. <year>2016</year>;<volume>187</volume>:<fpage>135</fpage>–<lpage>154</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1039/c5fd00176e" xlink:type="simple">10.1039/c5fd00176e</ext-link></comment> <object-id pub-id-type="pmid">27095185</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref019">
<label>19</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Anastasio</surname> <given-names>MA</given-names></name>, <name name-style="western"><surname>La Riviere</surname> <given-names>P</given-names></name>. <source>Emerging imaging technologies in medicine</source>. <publisher-name>CRC Press</publisher-name>; <year>2012</year>.</mixed-citation>
</ref>
<ref id="pone.0205219.ref020">
<label>20</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Reddy</surname> <given-names>RK</given-names></name>, <name name-style="western"><surname>Bhargava</surname> <given-names>R</given-names></name>. <article-title>Accurate histopathology from low signal-to-noise ratio spectroscopic imaging data</article-title>. <source>Analyst</source>. <year>2010</year>;<volume>135</volume>(<issue>11</issue>):<fpage>2818</fpage>–<lpage>2825</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1039/c0an00350f" xlink:type="simple">10.1039/c0an00350f</ext-link></comment> <object-id pub-id-type="pmid">20830324</object-id></mixed-citation>
</ref>
<ref id="pone.0205219.ref021">
<label>21</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Lee</surname> <given-names>JB</given-names></name>, <name name-style="western"><surname>Woodyatt</surname> <given-names>AS</given-names></name>, <name name-style="western"><surname>Berman</surname> <given-names>M</given-names></name>. <article-title>Enhancement of high spectral resolution remote-sensing data by a noise-adjusted principal components transform</article-title>. <source>Geoscience and Remote Sensing, IEEE Transactions on</source>. <year>1990</year>;<volume>28</volume>(<issue>3</issue>):<fpage>295</fpage>–<lpage>304</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/36.54356" xlink:type="simple">10.1109/36.54356</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0205219.ref022">
<label>22</label>
<mixed-citation publication-type="book" xlink:type="simple">
<name name-style="western"><surname>Bushberg</surname> <given-names>JT</given-names></name>, <name name-style="western"><surname>Boone</surname> <given-names>JM</given-names></name>. <source>The essential physics of medical imaging</source>. <publisher-name>Lippincott Williams &amp; Wilkins</publisher-name>; <year>2011</year>.</mixed-citation>
</ref>
<ref id="pone.0205219.ref023">
<label>23</label>
<mixed-citation publication-type="other" xlink:type="simple">Musco C, Musco C. Stronger approximate singular value decomposition via the block lanczos and power methods. Advances in Neural Information Processing Systems (NIPS). 2015;.</mixed-citation>
</ref>
<ref id="pone.0205219.ref024">
<label>24</label>
<mixed-citation publication-type="journal" xlink:type="simple">
<name name-style="western"><surname>Halko</surname> <given-names>N</given-names></name>, <name name-style="western"><surname>Martinsson</surname> <given-names>PG</given-names></name>, <name name-style="western"><surname>Tropp</surname> <given-names>JA</given-names></name>. <article-title>Finding structure with randomness: Probabilistic algorithms for constructing approximate matrix decompositions</article-title>. <source>SIAM review</source>. <year>2011</year>;<volume>53</volume>(<issue>2</issue>):<fpage>217</fpage>–<lpage>288</lpage>. <comment>doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1137/090771806" xlink:type="simple">10.1137/090771806</ext-link></comment></mixed-citation>
</ref>
<ref id="pone.0205219.ref025">
<label>25</label>
<mixed-citation publication-type="other" xlink:type="simple">Kong X, Li K, Yang Q, Wenyin L, Yang MH. A new image quality metric for image auto-denoising. In: Proceedings of the IEEE International Conference on Computer Vision; 2013. p. 2888–2895.</mixed-citation>
</ref>
</ref-list>
</back>
</article>