OpenMS  2.4.0
FeatureFindingMetabo.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2018.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Timo Sachsenberg $
32 // $Authors: Erhan Kenar, Holger Franken $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
42 
43 #include <vector>
44 #include <svm.h>
45 
46 namespace OpenMS
47 {
48 
// Internal structure used in FeatureFindingMetabo that keeps track of a
// feature hypothesis. It stores pointers to the MassTrace objects that make up
// one isotopic pattern, plus a score for that grouping.
//
// NOTE(review): the embedded source-line numbers jump (59 -> 62 -> 65 -> 68 -> 70,
// 100 -> 102, 116 -> 118), so this listing does not show every line of the header.
// The cross-reference index of this page places `SignedSize charge_` at line 117;
// that member is not visible below.
57  class OPENMS_DLLAPI FeatureHypothesis
58  {
59 public:
62 
65 
68 
    // Copy assignment from rhs; returns a reference to a FeatureHypothesis.
70  FeatureHypothesis& operator=(const FeatureHypothesis& rhs);
71 
72  // getter & setter
    // NOTE(review): all getters below are const and most return by value; what
    // exactly each one computes is defined in the implementation file, not here.
73  Size getSize() const;
74 
75  String getLabel() const;
76 
77  std::vector<String> getLabels() const;
78 
    // Presumably read/write access to feat_score_ -- TODO confirm in the .cpp.
79  double getScore() const;
80 
81  void setScore(const double& score);
82 
    // Charge is a SignedSize (ptrdiff_t), i.e. a signed value.
83  SignedSize getCharge() const;
84 
85  void setCharge(const SignedSize& ch);
86 
    // `smoothed` defaults to false when the caller omits it.
87  std::vector<double> getAllIntensities(bool smoothed = false) const;
88 
89  std::vector<double> getAllCentroidMZ() const;
90 
91  std::vector<double> getAllCentroidRT() const;
92 
93  std::vector<double> getIsotopeDistances() const;
94 
95  double getCentroidMZ() const;
96 
97  double getCentroidRT() const;
98 
99  double getFWHM() const;
100 
    // Takes the trace by const reference, while iso_pattern_ stores raw
    // `const MassTrace*`. NOTE(review): presumably the address of the argument is
    // kept, in which case the MassTrace must outlive this hypothesis -- confirm.
102  void addMassTrace(const MassTrace&);
    // NOTE(review): the bool parameter is unnamed here; presumably it selects
    // smoothed intensities as in getAllIntensities() -- verify against the .cpp.
103  double getMonoisotopicFeatureIntensity(bool) const;
104  double getSummedFeatureIntensity(bool) const;
105 
106  Size getNumFeatPoints() const;
107  std::vector<ConvexHull2D> getConvexHulls() const;
    // feature_id is a UInt64 (unsigned 64-bit integer); how it is used for the
    // returned chromatograms is not visible in this header.
108  std::vector< OpenMS::MSChromatogram > getChromatograms(UInt64 feature_id) const;
109 
110 private:
111 
112  // pointers of MassTraces contained in isotopic pattern
113  std::vector<const MassTrace*> iso_pattern_;
114 
    // Score of this hypothesis; CmpHypothesesByScore compares hypotheses via getScore().
115  double feat_score_;
116 
118  };
119 
// Binary predicate over two MassTrace objects: true when x's centroid m/z is
// strictly smaller than y's. Used as a sort comparator it therefore orders
// traces by increasing centroid m/z.
120  class OPENMS_DLLAPI CmpMassTraceByMZ
121  {
122 public:
123 
    // Returns x.getCentroidMZ() < y.getCentroidMZ(); neither argument is modified.
124  bool operator()(const MassTrace& x, const MassTrace& y) const
125  {
126  return x.getCentroidMZ() < y.getCentroidMZ();
127  }
128 
129  };
130 
// Binary predicate over two FeatureHypothesis objects: true when x's score is
// strictly greater than y's. Used as a sort comparator it therefore orders
// hypotheses by decreasing score (highest score first).
131  class OPENMS_DLLAPI CmpHypothesesByScore
132  {
133 public:
134 
    // Note the '>' (not '<'): the ordering is descending by getScore().
135  bool operator()(const FeatureHypothesis& x, const FeatureHypothesis& y) const
136  {
137  return x.getScore() > y.getScore();
138  }
139 
140  };
141 
// Method for the assembly of mass traces belonging to the same isotope pattern,
// i.e., that are compatible in retention times, mass-to-charge ratios, and
// isotope abundances.
//
// Derives publicly from DefaultParamHandler (base class for classes handling
// default parameters) and ProgressLogger (base class for classes that report
// their progress).
//
// NOTE(review): the embedded source-line numbers jump, so this listing does not
// show every line of the header. The cross-reference index of this page names
// members that are not visible below: total_intensity_ (274), local_rt_range_
// (277), local_mz_range_ (278), charge_lower_bound_ (279), charge_upper_bound_
// (280), report_summed_ints_ (283), enable_RT_filtering_ (284),
// isotope_filtering_model_ (285), use_smoothed_intensities_ (286),
// use_mz_scoring_C13_ (288), report_convex_hulls_ (289), report_chromatograms_
// (290) and remove_single_traces_ (292).
167  class OPENMS_DLLAPI FeatureFindingMetabo :
168  public DefaultParamHandler,
169  public ProgressLogger
170  {
171 public:
174 
    // Destructor; `override` means a base class declares a virtual destructor.
176  ~FeatureFindingMetabo() override;
177 
    // Public entry point. All three arguments are non-const references.
    // The output_* names suggest output_featmap and output_chromatograms are
    // filled by the call -- TODO confirm. NOTE(review): input_mtraces is also
    // non-const, so the call is allowed to modify the caller's vector.
179  void run(std::vector<MassTrace>& input_mtraces, FeatureMap& output_featmap, std::vector<std::vector< OpenMS::MSChromatogram > >& output_chromatograms);
180 
181 protected:
    // Overrides a virtual function of a base class; presumably the
    // DefaultParamHandler hook that refreshes the parameter members -- confirm.
182  void updateMembers_() override;
183 
184 private:
    // Two unnamed vectors of doubles in, one double out; const member function.
193  double computeCosineSim_(const std::vector<double>&, const std::vector<double>&) const;
194 
197  double computeOLSCoeff_(const std::vector<double>&, const std::vector<double>&) const;
198 
    // Returns an int rather than a bool; the meaning of the individual return
    // values is not visible in this header.
211  int isLegalIsotopePattern_(const FeatureHypothesis& feat_hypo) const;
212 
    // Non-const: NOTE(review): presumably populates isotope_filt_svm_ and the
    // svm_feat_* vectors from the given String -- verify in the .cpp.
213  void loadIsotopeModel_(const String&);
214 
    // Scores a pair of mass traces for a given isotopic position and charge
    // (both of type Size, i.e. unsigned).
235  double scoreMZ_(const MassTrace &, const MassTrace &, Size isotopic_position, Size charge) const;
236 
249  double scoreRT_(const MassTrace&, const MassTrace&) const;
250 
257  double computeAveragineSimScore_(const std::vector<double>& intensities, const double& molecular_weight) const;
258 
    // candidates holds raw const MassTrace pointers and is read-only;
    // output_hypotheses is a non-const reference, presumably appended to or
    // overwritten with the hypotheses found -- confirm which.
267  void findLocalFeatures_(const std::vector<const MassTrace*>& candidates, const double total_intensity, std::vector<FeatureHypothesis>& output_hypotheses) const;
268 
    // SVM parameters. isotope_filt_svm_ is a raw pointer to a libsvm svm_model.
    // NOTE(review): ownership and release of this pointer are not visible here;
    // presumably handled in the destructor -- confirm, since copying this class
    // would otherwise share the pointer.
270  svm_model* isotope_filt_svm_;
271  std::vector<double> svm_feat_centers_;
272  std::vector<double> svm_feat_scales_;
273 
275 
281  double chrom_fwhm_;
282 
287 
291 
293  };
294 
295 }
296 
A more convenient string class.
Definition: String.h:57
OpenMS::CmpHypothesesByScore
Definition: FeatureFindingMetabo.h:131
double local_mz_range_
Definition: FeatureFindingMetabo.h:278
A container for features.
Definition: FeatureMap.h:93
String isotope_filtering_model_
Definition: FeatureFindingMetabo.h:285
bool operator()(const MassTrace &x, const MassTrace &y) const
Definition: FeatureFindingMetabo.h:124
ptrdiff_t SignedSize
Signed Size type e.g. used as pointer difference.
Definition: Types.h:134
std::vector< const MassTrace * > iso_pattern_
Definition: FeatureFindingMetabo.h:113
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:46
bool use_smoothed_intensities_
Definition: FeatureFindingMetabo.h:286
Internal structure used in FeatureFindingMetabo that keeps track of a feature hypothesis (isotope group hypothesis).
Definition: FeatureFindingMetabo.h:57
double local_rt_range_
parameter stuff
Definition: FeatureFindingMetabo.h:277
double chrom_fwhm_
Definition: FeatureFindingMetabo.h:281
double getCentroidMZ() const
Returns the centroid m/z.
Definition: MassTrace.h:178
bool enable_RT_filtering_
Definition: FeatureFindingMetabo.h:284
OpenMS::CmpMassTraceByMZ
Definition: FeatureFindingMetabo.h:120
Size charge_upper_bound_
Definition: FeatureFindingMetabo.h:280
Size charge_lower_bound_
Definition: FeatureFindingMetabo.h:279
OPENMS_UINT64_TYPE UInt64
Unsigned integer type (64bit)
Definition: Types.h:77
bool remove_single_traces_
Definition: FeatureFindingMetabo.h:292
bool use_mz_scoring_C13_
Definition: FeatureFindingMetabo.h:288
SignedSize charge_
Definition: FeatureFindingMetabo.h:117
double feat_score_
Definition: FeatureFindingMetabo.h:115
bool report_chromatograms_
Definition: FeatureFindingMetabo.h:290
bool report_summed_ints_
Definition: FeatureFindingMetabo.h:283
std::vector< double > svm_feat_centers_
Definition: FeatureFindingMetabo.h:271
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
Base class for all classes that want to report their progress.
Definition: ProgressLogger.h:54
double total_intensity_
Definition: FeatureFindingMetabo.h:274
bool report_convex_hulls_
Definition: FeatureFindingMetabo.h:289
svm_model * isotope_filt_svm_
SVM parameters.
Definition: FeatureFindingMetabo.h:270
A base class for all classes handling default parameters.
Definition: DefaultParamHandler.h:91
bool operator()(const FeatureHypothesis &x, const FeatureHypothesis &y) const
Definition: FeatureFindingMetabo.h:135
std::vector< double > svm_feat_scales_
Definition: FeatureFindingMetabo.h:272
A container type that gathers peaks similar in m/z and moving along retention time.
Definition: MassTrace.h:61
Method for the assembly of mass traces belonging to the same isotope pattern, i.e., that are compatible in retention times, mass-to-charge ratios, and isotope abundances.
Definition: FeatureFindingMetabo.h:167