Home  · Classes  · Annotated Classes  · Modules  · Members  · Namespaces  · Related Pages
PeakTypeEstimator.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2017.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Timo Sachsenberg $
32 // $Authors: Marc Sturm, Marcel Schilling $
33 // --------------------------------------------------------------------------
34 
35 #ifndef OPENMS_FORMAT_PEAKTYPEESTIMATOR_H
36 #define OPENMS_FORMAT_PEAKTYPEESTIMATOR_H
37 
39 
40 #include <cmath>
41 #include <numeric>
42 
43 namespace OpenMS
44 {
50  class OPENMS_DLLAPI PeakTypeEstimator
51  {
52 public:
58  template <typename PeakConstIterator>
59  SpectrumSettings::SpectrumType estimateType(const PeakConstIterator & begin, const PeakConstIterator & end) const
60  {
61  const Size MAX_SAMPLED_DISTANCES = 1000;
62  const double DISTANCE_VARIANCE_THRESHOLD = 0.5;
63 
64  // abort if there are less than 5 peak in the iterator range
65  if (end - begin < 5)
66  {
68  }
69 
70  double count(0);
71 
72  std::vector<double> distances;
73 
74  PeakConstIterator peak(begin);
75 
76  for (; peak->getIntensity() <= 0 && peak != end - 2; ++peak) // 1st positive intensity
77  {
78  }
79 
80  double scnd_last_mz(peak->getMZ());
81 
82  for (++peak; peak->getIntensity() <= 0 && peak != end - 1; ++peak) // 2nd positive intensity
83  {
84  }
85 
86  double last_mz(peak->getMZ());
87 
88  double last_dist(last_mz - scnd_last_mz);
89 
90  for (++peak; peak != end && count < MAX_SAMPLED_DISTANCES; ++peak) // max positive intensity
91  {
92  if (peak->getIntensity() > 0)
93  {
94  double mz(peak->getMZ());
95  double dist(mz - last_mz);
96  distances.push_back(std::min(last_dist, dist)); // min distances
97  ++count;
98  scnd_last_mz = last_mz;
99  last_mz = mz;
100  last_dist = dist;
101  }
102  }
103 
104  if (count < 4) // at least 4 distances for non-zero(!) intensity peaks
105  {
107  }
108 
109  double mean(std::accumulate(distances.begin(), distances.end(), 0) / count); // sum/size
110 
111  // calculate variance
112  double variance(0);
113  for (std::vector<double>::iterator value = distances.begin(); value != distances.end(); ++value)
114  {
115  double delta = (*value - mean);
116  variance += delta * delta;
117  }
118  variance /= count - 1;
119 
120  // calculate stdev
121  double standard_deviation(std::sqrt(variance));
122 
123  if (standard_deviation < DISTANCE_VARIANCE_THRESHOLD)
124  {
126  }
127  else
128  {
130  }
131  }
132 
133  };
134 
135 } // namespace OpenMS
136 
137 #endif // OPENMS_FORMAT_PEAKTYPEESTIMATOR_H
static double variance(IteratorType begin, IteratorType end, double mean=std::numeric_limits< double >::max())
Calculates the variance of a range of values.
Definition: StatisticFunctions.h:280
Peak data (also called centroided data or stick data)
Definition: SpectrumSettings.h:74
SpectrumType
Spectrum peak type.
Definition: SpectrumSettings.h:71
Raw data (also called profile data)
Definition: SpectrumSettings.h:75
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:47
Unknown spectrum type.
Definition: SpectrumSettings.h:73
static double mean(IteratorType begin, IteratorType end)
Calculates the mean of a range of values.
Definition: StatisticFunctions.h:135
SpectrumSettings::SpectrumType estimateType(const PeakConstIterator &begin, const PeakConstIterator &end) const
Estimates the peak type of the peaks in the iterator range based on the variance of inter-peak distan...
Definition: PeakTypeEstimator.h:59
Estimates if the data of a spectrum is raw data or peak data.
Definition: PeakTypeEstimator.h:50
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:128

OpenMS / TOPP release 2.3.0 Documentation generated on Tue Jan 9 2018 18:22:03 using doxygen 1.8.13