OpenMS  2.6.0
InternalCalibration.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2020.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Chris Bielow $
32 // $Authors: Chris Bielow $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
43 
44 #include <vector>
45 
46 namespace OpenMS
47 {
48 
49  class FeatureMap;
50 
61  class OPENMS_DLLAPI InternalCalibration
62  : public ProgressLogger
63  {
64  public:
65 
68 
71 
73  struct LockMass
74  {
75  double mz;
76  unsigned int ms_level;
77  int charge;
78 
79  LockMass(double mz_, int lvl_, int charge_)
80  : mz(mz_),
81  ms_level(lvl_),
82  charge(charge_)
83  {}
84  };
85 
108  Size fillCalibrants(const PeakMap exp,
109  const std::vector<InternalCalibration::LockMass>& ref_masses,
110  double tol_ppm,
111  bool lock_require_mono,
112  bool lock_require_iso,
113  CalibrationData& failed_lock_masses,
114  bool verbose = true);
115 
137  Size fillCalibrants(const FeatureMap& fm, double tol_ppm);
138 
154  Size fillCalibrants(const std::vector<PeptideIdentification>& pep_ids, double tol_ppm);
155 
164  const CalibrationData& getCalibrationPoints() const;
165 
190  bool calibrate(PeakMap& exp,
191  const IntList& target_mslvl,
192  MZTrafoModel::MODELTYPE model_type,
193  double rt_chunk,
194  bool use_RANSAC,
195  double post_ppm_median,
196  double post_ppm_MAD,
197  const String& file_models = "",
198  const String& file_models_plot = "",
199  const String& file_residuals = "",
200  const String& file_residuals_plot = "",
201  const String& rscript_executable = "Rscript");
202 
203  /*
204  @brief Transform a precursor's m/z
205 
206  Calibrate m/z of precursors.
207 
208  @param pcs Uncalibrated Precursors
209  @param trafo The calibration function to apply
210  */
211  static void applyTransformation(std::vector<Precursor>& pcs, const MZTrafoModel& trafo);
212 
213  /*
214  @brief Transform a spectrum (data+precursor)
215 
216  See applyTransformation(MSExperiment, ...) for details.
217 
218  @param spec Uncalibrated MSSpectrum
219  @param target_mslvl List (can be unsorted) of MS levels to calibrate
220  @param trafo The calibration function to apply
221  */
222  static void applyTransformation(PeakMap::SpectrumType& spec, const IntList& target_mslvl, const MZTrafoModel& trafo);
223 
224  /*
225  @brief Transform spectra from a whole map (data+precursor)
226 
227  All data peaks and precursor information (if present) are calibrated in m/z.
228 
229  Only spectra whose MS-level is contained in 'target_mslvl' are calibrated.
230  In addition, if a fragmentation spectrum's precursor information originates from an MS level in 'target_mslvl',
231  the precursor (not the spectrum itself) is also subjected to calibration.
232  E.g., If we only have MS and MS/MS spectra: for 'target_mslvl' = {1} then all MS1 spectra and MS2 precursors are calibrated.
233  If 'target_mslvl' = {2}, only MS2 spectra (not their precursors) are calibrated.
234  If 'target_mslvl' = {1,2} all spectra and precursors are calibrated.
235 
236 
237  @param exp Uncalibrated peak map
238  @param target_mslvl List (can be unsorted) of MS levels to calibrate
239  @param trafo The calibration function to apply
240  */
241  static void applyTransformation(PeakMap& exp, const IntList& target_mslvl, const MZTrafoModel& trafo);
242 
243  protected:
244 
247  {
248  CalibrantStats_(const double tol_ppm)
249  : tol_ppm_(tol_ppm)
250  {};
251  Size cnt_empty = 0;
252  Size cnt_nomz = 0;
253  Size cnt_nort = 0;
254  Size cnt_decal = 0;
255  Size cnt_total = 0;
256 
257  void print() const
258  {
259  if (cnt_empty > 0) OPENMS_LOG_WARN << "Warning: " << cnt_empty << "/" << cnt_total << " calibrations points were skipped, since they have no peptide sequence!" << std::endl;
260  if (cnt_nomz > 0) OPENMS_LOG_WARN << "Warning: " << cnt_nomz << "/" << cnt_total << " calibrations points were skipped, since they have no m/z value!" << std::endl;
261  if (cnt_nort > 0) OPENMS_LOG_WARN << "Warning: " << cnt_nort << "/" << cnt_total << " calibrations points were skipped, since they have no RT value!" << std::endl;
262  if (cnt_decal > 0) OPENMS_LOG_WARN << "Warning: " << cnt_decal << "/" << cnt_total << " calibrations points were skipped, since their theoretical weight is more than " << tol_ppm_ << " ppm away from their measured mass!" << std::endl;
263  }
264 
265  private:
266  const double tol_ppm_;
267  };
268 
285  void fillID_( const PeptideIdentification& pep_id, const double tol_ppm, CalibrantStats_& stats);
286 
288  void fillIDs_(const std::vector<PeptideIdentification>& pep_ids, const double tol_ppm, CalibrantStats_& stats);
289 
291  bool isDecalibrated_(const PeptideIdentification& pep_id, const double mz_obs, const double tol_ppm, CalibrantStats_& stats, double& mz_ref);
292 
293  /*
294  @brief Calibrate m/z of a spectrum, ignoring precursors!
295 
296  This method is not exposed as public, because its easy to be misused on spectra while forgetting about the precursors of high-level spectra.
297  */
298  static void applyTransformation_(PeakMap::SpectrumType& spec, const MZTrafoModel& trafo);
299 
300  private:
302  }; // class InternalCalibration
303 
304 } // namespace OpenMS
305 
OpenMS::InternalCalibration::CalibrantStats_::CalibrantStats_
CalibrantStats_(const double tol_ppm)
Definition: InternalCalibration.h:248
OpenMS::FileTypes::IDXML
OpenMS identification format (.idXML)
Definition: FileTypes.h:66
OpenMS::TOPPBase
Base class for TOPP applications.
Definition: TOPPBase.h:144
OpenMS::MZTrafoModel::setRANSACParams
static void setRANSACParams(const Math::RANSACParam &p)
Set the global (program wide) parameters for RANSAC.
OpenMS::TextFile::end
ConstIterator end() const
Gives access to the underlying text buffer.
OpenMS::MSExperiment::set2DData
void set2DData(const Container &container)
Assignment of a data container with RT and MZ to an MSExperiment.
Definition: MSExperiment.h:246
FileHandler.h
FileTypes.h
TextFile.h
OpenMS::InternalCalibration::CalibrantStats_::tol_ppm_
const double tol_ppm_
tolerance used for counting cnt_decal
Definition: InternalCalibration.h:266
OpenMS::MzMLFile::store
void store(const String &filename, const PeakMap &map) const
Stores a map in an MzML file.
OpenMS::MZTrafoModel::setCoefficientLimits
static void setCoefficientLimits(double offset, double scale, double power)
Set coefficient boundaries for which the model coefficient must not exceed to be considered a valid m...
OpenMS::MZTrafoModel::MODELTYPE
MODELTYPE
Definition: MZTrafoModel.h:98
InternalCalibration.h
OpenMS::Math::RANSACParam
A simple struct to carry all the parameters required for a RANSAC run.
Definition: RANSAC.h:58
OpenMS::InternalCalibration::CalibrantStats_
statistics when adding peptide calibrants
Definition: InternalCalibration.h:246
OpenMS::MzMLFile
File adapter for MzML files.
Definition: MzMLFile.h:55
OpenMS::String
A more convenient string class.
Definition: String.h:59
MzMLFile.h
OpenMS::MSExperiment
In-Memory representation of a mass spectrometry experiment.
Definition: MSExperiment.h:77
OpenMS::FileHandler::getTypeByContent
static FileTypes::Type getTypeByContent(const String &filename)
Determines the file type of a file by parsing the first few lines.
OpenMS::TextFile
This class provides some basic file handling methods for text files.
Definition: TextFile.h:46
OpenMS::Size
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
IdXMLFile.h
FeatureXMLFile.h
OpenMS::InternalCalibration::LockMass
helper class, describing a lock mass
Definition: InternalCalibration.h:73
OpenMS::InternalCalibration::LockMass::charge
int charge
charge of the ion (to find isotopes)
Definition: InternalCalibration.h:77
OpenMS::InternalCalibration::LockMass::mz
double mz
m/z of the lock mass (incl. adducts)
Definition: InternalCalibration.h:75
OpenMS::IntList
std::vector< Int > IntList
Vector of signed integers.
Definition: ListUtils.h:55
OPENMS_LOG_WARN
#define OPENMS_LOG_WARN
Macro if a warning, a piece of information which should be read by the user, should be logged.
Definition: LogStream.h:460
OpenMS::InternalCalibration
A mass recalibration method using linear/quadratic interpolation (robust/weighted) of given reference...
Definition: InternalCalibration.h:61
MZTrafoModel.h
OpenMS::String::hasSubstring
bool hasSubstring(const String &string) const
true if String contains the string, false otherwise
ListUtils.h
OpenMS::CalibrationData::getMetaValues
static StringList getMetaValues()
List of meta-values which are used internally (for conversion to PeakMap).
OpenMS::IdXMLFile::load
void load(const String &filename, std::vector< ProteinIdentification > &protein_ids, std::vector< PeptideIdentification > &peptide_ids)
Loads the identifications of an idXML file without identifier.
OpenMS::MZTrafoModel::enumToName
static const std::string & enumToName(MODELTYPE mt)
Convert enum to string.
OpenMS::InternalCalibration::calibrate
bool calibrate(PeakMap &exp, const IntList &target_mslvl, MZTrafoModel::MODELTYPE model_type, double rt_chunk, bool use_RANSAC, double post_ppm_median, double post_ppm_MAD, const String &file_models="", const String &file_models_plot="", const String &file_residuals="", const String &file_residuals_plot="", const String &rscript_executable="Rscript")
Apply calibration to data.
OpenMS
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:46
OpenMS::FileTypes::FEATUREXML
OpenMS feature file (.featureXML)
Definition: FileTypes.h:65
OpenMS::ProgressLogger
Base class for all classes that want to report their progress.
Definition: ProgressLogger.h:54
ProgressLogger.h
OpenMS::MzMLFile::load
void load(const String &filename, PeakMap &map)
Loads a map from a MzML file. Spectra and chromatograms are sorted by default (this can be disabled u...
TransformationXMLFile.h
OpenMS::InternalCalibration::LockMass::LockMass
LockMass(double mz_, int lvl_, int charge_)
Definition: InternalCalibration.h:79
int
OpenMS::FileHandler
Facilitates file handling by file type recognition.
Definition: FileHandler.h:62
OpenMS::FeatureXMLFile::load
void load(const String &filename, FeatureMap &feature_map)
loads the file with name filename into map and calls updateRanges().
FeatureMap.h
OpenMS::FileTypes::Type
Type
Actual file types enum.
Definition: FileTypes.h:58
OpenMS::MZTrafoModel::LINEAR_WEIGHTED
Definition: MZTrafoModel.h:98
OpenMS::DataProcessing::CALIBRATION
Calibration of m/z positions.
Definition: DataProcessing.h:69
OpenMS::CalibrationData::empty
bool empty() const
Do we have any calibration points.
main
int main(int argc, const char **argv)
Definition: INIFileEditor.cpp:73
OpenMS::InternalCalibration::cal_data_
CalibrationData cal_data_
Definition: InternalCalibration.h:301
MSExperiment.h
OpenMS::TextFile::begin
ConstIterator begin() const
Gives access to the underlying text buffer.
OpenMS::Internal::ClassTest::verbose
int verbose
Verbosity level ( "-v" is 1 and "-V" is 2 )
OpenMS::MZTrafoModel::SIZE_OF_MODELTYPE
Definition: MZTrafoModel.h:98
OpenMS::InternalCalibration::fillCalibrants
Size fillCalibrants(const PeakMap exp, const std::vector< InternalCalibration::LockMass > &ref_masses, double tol_ppm, bool lock_require_mono, bool lock_require_iso, CalibrationData &failed_lock_masses, bool verbose=true)
Extract calibrants from Raw data (mzML)
OPENMS_LOG_ERROR
#define OPENMS_LOG_ERROR
Macro to be used if non-fatal error are reported (processing continues)
Definition: LogStream.h:455
OpenMS::FeatureMap
A container for features.
Definition: FeatureMap.h:97
OpenMS::PeptideIdentification
Represents the peptide hits for a spectrum.
Definition: PeptideIdentification.h:62
OpenMS::InternalCalibration::~InternalCalibration
~InternalCalibration()
Destructor.
Definition: InternalCalibration.h:70
OpenMS::InternalCalibration::CalibrantStats_::print
void print() const
Definition: InternalCalibration.h:257
OpenMS::MZTrafoModel
Create and apply models of a mass recalibration function.
Definition: MZTrafoModel.h:66
OpenMS::FeatureXMLFile
This class provides Input/Output functionality for feature maps.
Definition: FeatureXMLFile.h:68
OpenMS::InternalCalibration::LockMass::ms_level
unsigned int ms_level
MS level where it occurs.
Definition: InternalCalibration.h:76
OpenMS::MZTrafoModel::nameToEnum
static MODELTYPE nameToEnum(const std::string &name)
Convert string to enum.
CalibrationData.h
OpenMS::Exception::MissingInformation
Not all required information provided.
Definition: Exception.h:195
OPENMS_LOG_INFO
#define OPENMS_LOG_INFO
Macro if a information, e.g. a status should be reported.
Definition: LogStream.h:465
OpenMS::MSSpectrum
The representation of a 1D spectrum.
Definition: MSSpectrum.h:67
OpenMS::CalibrationData
A helper class, holding all calibration points.
Definition: CalibrationData.h:64
OpenMS::TextFile::ConstIterator
std::vector< String >::const_iterator ConstIterator
Non-mutable iterator.
Definition: TextFile.h:56
OpenMS::MZTrafoModel::names_of_modeltype
static const std::string names_of_modeltype[]
strings corresponding to enum MODELTYPE
Definition: MZTrafoModel.h:99
OpenMS::TextFile::load
void load(const String &filename, bool trim_lines=false, Int first_n=-1, bool skip_empty_lines=false)
Loads data from a text file.
StandardTypes.h
OpenMS::ProgressLogger::setLogType
void setLogType(LogType type) const
Sets the progress log that should be used. The default type is NONE!
TOPPBase.h
OpenMS::InternalCalibration::getCalibrationPoints
const CalibrationData & getCalibrationPoints() const
Get container of calibration points.
OpenMS::IdXMLFile
Used to load and store idXML files.
Definition: IdXMLFile.h:63