OpenMS
Loading...
Searching...
No Matches
SequestInfile.h
Go to the documentation of this file.
1// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin
2// SPDX-License-Identifier: BSD-3-Clause
3//
4// --------------------------------------------------------------------------
5// $Maintainer: Timo Sachsenberg $
6// $Authors: Martin Langwisch $
7// --------------------------------------------------------------------------
8
9#pragma once
10
12
13#include <map>
14
15
16namespace OpenMS
17{
25 class OPENMS_DLLAPI SequestInfile
26 {
27public:
30
32 SequestInfile(const SequestInfile & sequest_infile);
33
35 virtual ~SequestInfile();
36
38 SequestInfile & operator=(const SequestInfile & sequest_infile);
39
41 bool operator==(const SequestInfile & sequest_infile) const;
42
47 void store(const std::string & filename);
48
50 const std::string getEnzymeInfoAsString() const;
51
53 const std::string & getDatabase() const;
55 void setDatabase(const std::string & database);
56
58 const std::string & getNeutralLossesForIons() const;
60 void setNeutralLossesForIons(const std::string & neutral_losses_for_ions);
61
63 const std::string & getIonSeriesWeights() const;
65 void setIonSeriesWeights(const std::string & ion_series_weights);
66
68 const std::string & getPartialSequence() const;
70 void setPartialSequence(const std::string & partial_sequence);
71
73 const std::string & getSequenceHeaderFilter() const;
75 void setSequenceHeaderFilter(const std::string & sequence_header_filter);
76
78 const std::string & getProteinMassFilter() const;
80 void setProteinMassFilter(const std::string & protein_mass_filter);
81
82
84 float getPeakMassTolerance() const;
86 void setPeakMassTolerance(float peak_mass_tolerance);
87
91 void setPrecursorMassTolerance(float precursor_mass_tolerance);
92
94 float getMatchPeakTolerance() const;
96 void setMatchPeakTolerance(float match_peak_tolerance);
97
101 void setIonCutoffPercentage(float ion_cutoff_percentage);
102
106 void setPeptideMassUnit(Size peptide_mass_unit);
107
111 void setOutputLines(Size output_lines);
112
116 std::string getEnzymeName() const;
118 Size setEnzyme(const std::string& enzyme_name);
119
123 void setMaxAAPerModPerPeptide(Size max_aa_per_mod_per_peptide);
124
128 void setMaxModsPerPeptide(Size max_mods_per_peptide);
129
143 void setNucleotideReadingFrame(Size nucleotide_reading_frame);
144
148 void setMaxInternalCleavageSites(Size max_internal_cleavage_sites);
149
153 void setMatchPeakCount(Size match_peak_count);
154
158 void setMatchPeakAllowedError(Size match_peak_allowed_error);
159
160
164 void setShowFragmentIons(bool show_fragments);
165
169 void setPrintDuplicateReferences(bool print_duplicate_references);
170
174 void setRemovePrecursorNearPeaks(bool remove_precursor_near_peaks);
175
177 bool getMassTypeParent() const;
179 void setMassTypeParent(bool mass_type_parent);
180
184 void setMassTypeFragment(bool mass_type_fragment);
185
187 bool getNormalizeXcorr() const;
189 void setNormalizeXcorr(bool normalize_xcorr);
190
194 void setResiduesInUpperCase(bool residues_in_upper_case);
195
199 void addEnzymeInfo(std::vector<std::string> & enzyme_info);
200
202 const std::map<std::string, std::vector<std::string> > & getModifications() const;
203
215 void handlePTMs(const std::string & modification_line, const std::string & modifications_filename, const bool monoisotopic);
216
217protected:
219 const std::map<std::string, std::vector<std::string> > & getEnzymeInfo_() const;
220
223
224 std::map<std::string, std::vector<std::string> > enzyme_info_;
225 std::string database_;
226 std::string snd_database_;
229 std::string partial_sequence_;
232
237
257
258
266
267 std::map<std::string, std::vector<std::string> > PTMname_residues_mass_type_;
268 };
269
270} // namespace OpenMS
271
Definition SequestInfile.h:26
void setShowFragmentIons(bool show_fragments)
sets whether fragment ions shall be displayed
Size setEnzyme(const std::string &enzyme_name)
sets the enzyme used for cleavage (by means of the number from a list of enzymes)
void setProteinMassFilter(const std::string &protein_mass_filter)
sets the protein mass filter (either min and max mass, or mass and tolerance value in percent)
Size getMaxInternalCleavageSites() const
returns the maximum number of internal cleavage sites
void setOutputLines(Size output_lines)
sets the number of peptides to be displayed
bool getResiduesInUpperCase() const
returns whether residues are in upper case
void setMatchPeakTolerance(float match_peak_tolerance)
sets the match peak tolerance
float match_peak_tolerance_
minimum distance between two experimental peaks
Definition SequestInfile.h:235
void setMatchPeakAllowedError(Size match_peak_allowed_error)
sets the number of top abundant peaks that are allowed not to match with a theoretical peak
void setMaxAAPerModPerPeptide(Size max_aa_per_mod_per_peptide)
sets the maximum number of amino acids containing the same modification in a peptide
Size max_mods_per_peptide_
maximum number of modifications per peptide
Definition SequestInfile.h:242
std::string snd_database_
second database used
Definition SequestInfile.h:226
std::string neutral_losses_for_ions_
whether neutral losses are considered for the a-; b- and y-ions (e.g. 011 for b- and y-ions)
Definition SequestInfile.h:227
Size getMaxModsPerPeptide() const
returns the maximum number of modifications that are allowed in a peptide
void setDatabase(const std::string &database)
sets the used database
Size output_lines_
number of peptides to be displayed
Definition SequestInfile.h:239
void setPeakMassTolerance(float peak_mass_tolerance)
sets the peak mass tolerance
void setIonCutoffPercentage(float ion_cutoff_percentage)
sets the ion cutoff of the ratio matching theoretical peaks/theoretical peaks
void setNucleotideReadingFrame(Size nucleotide_reading_frame)
void setResiduesInUpperCase(bool residues_in_upper_case)
sets whether residues are in upper case
void setPrintDuplicateReferences(bool print_duplicate_references)
sets whether all proteins containing a found peptide should be displayed
const std::map< std::string, std::vector< std::string > > & getEnzymeInfo_() const
returns the enzyme list
void setMaxModsPerPeptide(Size max_mods_per_peptide)
set the maximum number of modifications that are allowed in a peptide
float ion_cutoff_percentage_
cutoff of the ratio matching theoretical peaks/theoretical peaks
Definition SequestInfile.h:236
void setSequenceHeaderFilter(const std::string &sequence_header_filter)
sets the sequences (space delimited) that have to occur, or be absent (preceded by a tilde) in the he...
float getPrecursorMassTolerance() const
returns the precursor mass tolerance
float precursor_mass_tolerance_
tolerance for matching a theoretical to an experimental peptide
Definition SequestInfile.h:233
std::string database_
database used
Definition SequestInfile.h:225
const std::string & getDatabase() const
returns the used database
void handlePTMs(const std::string &modification_line, const std::string &modifications_filename, const bool monoisotopic)
Size getEnzymeNumber() const
returns the enzyme used for cleavage (by means of the number from a list of enzymes)
void addEnzymeInfo(std::vector< std::string > &enzyme_info)
bool getRemovePrecursorNearPeaks() const
return whether peaks near (15 amu) the precursor peak are removed
void setNeutralLossesForIons(const std::string &neutral_losses_for_ions)
sets whether neutral losses are considered for the a-, b- and y-ions
void setRemovePrecursorNearPeaks(bool remove_precursor_near_peaks)
sets whether peaks near (15 amu) the precursor peak are removed
bool residues_in_upper_case_
whether residues are in upper case
Definition SequestInfile.h:265
Size max_internal_cleavage_sites_
maximum number of internal cleavage sites
Definition SequestInfile.h:254
float getIonCutoffPercentage() const
returns the the cutoff of the ratio matching theoretical peaks/theoretical peaks
Size nucleotide_reading_frame_
Definition SequestInfile.h:243
float peak_mass_tolerance_
tolerance for matching a theoretical to an experimental peak
Definition SequestInfile.h:234
const std::string & getPartialSequence() const
returns the partial sequences (space delimited) that have to occur in the theoretical spectra
const std::map< std::string, std::vector< std::string > > & getModifications() const
return the modifications (the modification names map to the affected residues, the mass change and th...
std::string ion_series_weights_
weights for the a-; b-; c-; d-; v-; w-; x-; y- and z-ion series; space delimited
Definition SequestInfile.h:228
Size getPeptideMassUnit() const
returns the peptide mass unit
const std::string & getNeutralLossesForIons() const
returns whether neutral losses are considered for the a-, b- and y-ions
std::string getEnzymeName() const
returns the enzyme used for cleavage
Size getMatchPeakCount() const
returns the number of top abundant peaks to match with theoretical ones
float getMatchPeakTolerance() const
returns the match peak tolerance
void setMassTypeParent(bool mass_type_parent)
sets the mass type of the parent (0 - monoisotopic, 1 - average mass)
bool getNormalizeXcorr() const
returns whether normalized xcorr values are displayed
Size peptide_mass_unit_
peptide mass unit (0 = amu; 1 = mmu; 2 = ppm)
Definition SequestInfile.h:238
bool remove_precursor_near_peaks_
whether peaks near (15 amu) the precursor peak are removed
Definition SequestInfile.h:261
std::map< std::string, std::vector< std::string > > enzyme_info_
an endline-delimited list of enzymes; each with cutting direction 0 (N to C) /1; cuts after (list of ...
Definition SequestInfile.h:224
std::string sequence_header_filter_
space-delimited list of sequences that have to occur or be absent (preceded by a tilde) in a protein ...
Definition SequestInfile.h:230
bool show_fragment_ions_
whether to display fragment ions
Definition SequestInfile.h:259
void setMatchPeakCount(Size match_peak_count)
sets the number of top abundant peaks to with theoretical ones
std::string protein_mass_filter_
Definition SequestInfile.h:231
Size getMaxAAPerModPerPeptide() const
returns the maximum number of amino acids containing the same modification in a peptide
Size match_peak_count_
number of the top abundant peaks to match with theoretical one
Definition SequestInfile.h:255
SequestInfile()
default constructor
const std::string getEnzymeInfoAsString() const
returns the enzyme list as a string
bool operator==(const SequestInfile &sequest_infile) const
equality operator
void store(const std::string &filename)
void setNormalizeXcorr(bool normalize_xcorr)
sets whether normalized xcorr values are displayed
SequestInfile & operator=(const SequestInfile &sequest_infile)
assignment operator
bool mass_type_parent_
mass type of the parent peak (0 - monoisotopic; 1 - average)
Definition SequestInfile.h:262
void setStandardEnzymeInfo_()
returns some standard enzymes (used to initialize the enzyme list)
void setIonSeriesWeights(const std::string &ion_series_weights)
sets the weights for the a-, b-, c-, d-, v-, w-, x-, y- and z-ion series
Size enzyme_number_
number of the enzyme used for cleavage
Definition SequestInfile.h:240
bool print_duplicate_references_
whether all proteins containing a found peptide should be displayed
Definition SequestInfile.h:260
void setPartialSequence(const std::string &partial_sequence)
sets the partial sequences (space delimited) that have to occur in the theoretical spectra
Size getNucleotideReadingFrame() const
returns the nucleotide reading frame
void setPrecursorMassTolerance(float precursor_mass_tolerance)
sets the precursor mass tolerance
Size getMatchPeakAllowedError() const
returns the number of top abundant peaks that are allowed not to match with a theoretical peak
const std::string & getSequenceHeaderFilter() const
returns the sequences (space delimited) that have to occur, or be absent (preceded by a tilde) in the...
virtual ~SequestInfile()
destructor
bool mass_type_fragment_
mass type of fragment peaks (0 - monoisotopic; 1 - average)
Definition SequestInfile.h:263
bool getShowFragmentIons() const
returns whether fragment ions shall be displayed
std::string partial_sequence_
space-delimited list of sequence parts that have to occur in the theoretical spectra
Definition SequestInfile.h:229
Size match_peak_allowed_error_
number of peaks that may lack this test
Definition SequestInfile.h:256
void setMassTypeFragment(bool mass_type_fragment)
sets the mass type of the fragments (0 - monoisotopic, 1 - average mass)
bool getMassTypeFragment() const
return the mass type of the fragments (0 - monoisotopic, 1 - average mass)
std::map< std::string, std::vector< std::string > > PTMname_residues_mass_type_
the modification names map to the affected residues, the mass change and the type
Definition SequestInfile.h:267
float getPeakMassTolerance() const
returns the peak mass tolerance
bool getPrintDuplicateReferences() const
returns whether all proteins containing a found peptide should be displayed
bool normalize_xcorr_
whether to display normalized xcorr values
Definition SequestInfile.h:264
void setPeptideMassUnit(Size peptide_mass_unit)
sets the peptide mass unit
Size max_AA_per_mod_per_peptide_
maximum number of amino acids containing the same modification in a peptide
Definition SequestInfile.h:241
const std::string & getIonSeriesWeights() const
returns the weights for the a-, b-, c-, d-, v-, w-, x-, y- and z-ion series
SequestInfile(const SequestInfile &sequest_infile)
copy constructor
const std::string & getProteinMassFilter() const
returns the protein mass filter (either min and max mass, or mass and tolerance value in percent)
bool getMassTypeParent() const
return the mass type of the parent (0 - monoisotopic, 1 - average mass)
Size getOutputLines() const
return the number of peptides to be displayed
void setMaxInternalCleavageSites(Size max_internal_cleavage_sites)
sets the maximum number of internal cleavage sites
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition Types.h:97
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19