OpenMS  2.5.0
SvmTheoreticalSpectrumGeneratorTrainer.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2020.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Timo Sachsenberg $
32 // $Authors: Sandro Andreotti $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
41 
44 #include <OpenMS/FORMAT/TextFile.h>
45 
46 namespace OpenMS
47 {
66  public DefaultParamHandler
67  {
70  typedef std::map<std::pair<IonType, Size>, std::vector<double> > ObservedIntensMap;
71 
73  void countIntensities_(const PeakSpectrum & spectrum,
74  const AASequence & annotation,
75  IonType type,
76  std::map<std::pair<IonType, Size>, std::vector<double> > & observed_intensities,
77  double tolerance,
78  Size number_of_regions
79  );
80 
82  void trainSecondaryTypes_(TextFile & info_outfile,
83  Size number_of_regions,
84  Size number_of_intensity_levels,
85  ObservedIntensMap & observed_intensities,
86  const std::vector<IonType> & ion_types,
87  const std::vector<bool> & is_primary
88  );
89 public:
90 
96 
99 
103 
106 
108  void trainModel(const PeakMap & spectra, const std::vector<AASequence> & annotations, String filename, Int precursor_charge);
109 
111  void normalizeIntensity(PeakSpectrum & S) const;
112 
113 protected:
114 
116  void writeTrainingFile_(std::vector<DescriptorSet> & training_input, std::vector<double> & training_output, String filename);
117 
118  };
119 }
120 
DefaultParamHandler.h
OpenMS::TOPPBase
Base class for TOPP applications.
Definition: TOPPBase.h:144
OpenMS::SvmTheoreticalSpectrumGeneratorTrainer::DescriptorSet
SvmTheoreticalSpectrumGenerator::DescriptorSet DescriptorSet
Definition: SvmTheoreticalSpectrumGeneratorTrainer.h:69
OpenMS::Param::copy
Param copy(const String &prefix, bool remove_prefix=false) const
Returns a new Param object containing all entries that start with prefix.
TextFile.h
SvmTheoreticalSpectrumGeneratorTrainer.h
OpenMS::Param::setValue
void setValue(const String &key, const DataValue &value, const String &description="", const StringList &tags=StringList())
Sets a value.
OpenMS::SvmTheoreticalSpectrumGeneratorTrainer
Train SVM models that are used by SvmTheoreticalSpectrumGenerator.
Definition: SvmTheoreticalSpectrumGeneratorTrainer.h:65
OpenMS::SvmTheoreticalSpectrumGeneratorTrainer::ObservedIntensMap
std::map< std::pair< IonType, Size >, std::vector< double > > ObservedIntensMap
Definition: SvmTheoreticalSpectrumGeneratorTrainer.h:70
OpenMS::MzMLFile
File adapter for MzML files.
Definition: MzMLFile.h:55
OpenMS::String
A more convenient string class.
Definition: String.h:58
OpenMS::MSExperiment::begin
Iterator begin()
Definition: MSExperiment.h:157
MzMLFile.h
OpenMS::MSExperiment
In-Memory representation of a mass spectrometry experiment.
Definition: MSExperiment.h:77
OpenMS::TextFile
This class provides some basic file handling methods for text files.
Definition: TextFile.h:46
OpenMS::Size
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
IdXMLFile.h
OpenMS::SvmTheoreticalSpectrumGeneratorTrainer::IonType
SvmTheoreticalSpectrumGenerator::IonType IonType
Definition: SvmTheoreticalSpectrumGeneratorTrainer.h:68
OpenMS::IDMapper::annotate
void annotate(PeakMap &map, const std::vector< PeptideIdentification > &peptide_ids, const std::vector< ProteinIdentification > &protein_ids, const bool clear_ids=false, const bool map_ms1=false)
Mapping method for peak maps.
OpenMS::DefaultParamHandler
A base class for all classes handling default parameters.
Definition: DefaultParamHandler.h:91
OpenMS::IdXMLFile::load
void load(const String &filename, std::vector< ProteinIdentification > &protein_ids, std::vector< PeptideIdentification > &peptide_ids)
Loads the identifications of an idXML file without identifier.
OpenMS
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:46
OpenMS::MzMLFile::load
void load(const String &filename, PeakMap &map)
Loads a map from a MzML file. Spectra and chromatograms are sorted by default (this can be disabled u...
OpenMS::MSExperiment::iterator
Base::iterator iterator
Definition: MSExperiment.h:124
int
OpenMS::DefaultParamHandler::setParameters
void setParameters(const Param &param)
Sets the parameters.
OpenMS::DefaultParamHandler::getDefaults
const Param & getDefaults() const
Non-mutable access to the default parameters.
IDMapper.h
main
int main(int argc, const char **argv)
Definition: INIFileEditor.cpp:73
MSExperiment.h
OpenMS::Param::remove
void remove(const String &key)
Remove the entry key or a section key (when suffix is ':')
SvmTheoreticalSpectrumGenerator.h
OpenMS::MSExperiment::end
Iterator end()
Definition: MSExperiment.h:167
OpenMS::SvmTheoreticalSpectrumGeneratorTrainer::trainModel
void trainModel(const PeakMap &spectra, const std::vector< AASequence > &annotations, String filename, Int precursor_charge)
trains an SVM for each ion_type and stores them in files <filename>_residue_loss_charge....
StandardDeclarations.h
OpenMS::Param
Management and storage of parameters / INI files.
Definition: Param.h:73
OpenMS::AASequence
Representation of a peptide/protein sequence.
Definition: AASequence.h:113
OpenMS::IDMapper
Annotates an MSExperiment, FeatureMap or ConsensusMap with peptide identifications.
Definition: IDMapper.h:66
OpenMS::MSSpectrum
The representation of a 1D spectrum.
Definition: MSSpectrum.h:67
OpenMS::SvmTheoreticalSpectrumGenerator::IonType
nested class
Definition: SvmTheoreticalSpectrumGenerator.h:82
StandardTypes.h
TOPPBase.h
MSSpectrum.h
OpenMS::IdXMLFile
Used to load and store idXML files.
Definition: IdXMLFile.h:63
OpenMS::SvmTheoreticalSpectrumGenerator::DescriptorSet
A set of descriptors for a single training row.
Definition: SvmTheoreticalSpectrumGenerator.h:140