nightly/html/EmgScoring_8h_source.html

// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin

// SPDX-License-Identifier: BSD-3-Clause

//

// --------------------------------------------------------------------------

// $Maintainer: Hannes Roest $

// $Authors: Hannes Roest $

// --------------------------------------------------------------------------


#pragma once


#include <OpenMS/FEATUREFINDER/EmgFitter1D.h>
#include <OpenMS/FEATUREFINDER/EmgModel.h>
#include <OpenMS/PROCESSING/SMOOTHING/GaussFilter.h>

#include <OpenMS/KERNEL/MRMFeature.h>
#include <OpenMS/KERNEL/MRMTransitionGroup.h>
#include <OpenMS/KERNEL/MSSpectrum.h>

#include <OpenMS/KERNEL/StandardTypes.h>

#include <cmath> // for isnan
#include <memory>
#include <numeric>
#include <vector>


namespace OpenMS

{


  class EmgScoring

  {


  public :


    EmgScoring() = default;


    ~EmgScoring() = default;


    void setFitterParam(const Param& param)

    {

      fitter_emg1D_params_ = param;

    }


    Param getDefaults()

    {

      return EmgFitter1D().getDefaults();

    }


    template<typename SpectrumType, class TransitionT>


    double calcElutionFitScore(MRMFeature & mrmfeature, MRMTransitionGroup<SpectrumType, TransitionT> & transition_group) const

    {

      double avg_score = 0;

      bool smooth_data = false;


      for (Size k = 0; k < transition_group.size(); k++)

      {

        // get the id, then find the corresponding transition and features within this peakgroup

        String native_id = transition_group.getChromatograms()[k].getNativeID();

        Feature f = mrmfeature.getFeature(native_id);

        OPENMS_PRECONDITION(f.getConvexHulls().size() == 1, "Convex hulls need to have exactly one hull point structure");


        //TODO think about penalizing aborted fits even more. Currently -1 is just the "lowest" pearson correlation to

        // a fit that you can have.

        double fscore = elutionModelFit(f.getConvexHulls()[0].getHullPoints(), smooth_data);

        avg_score += fscore;

      }


      avg_score /= transition_group.size();

      return avg_score;

    }


    // Fxn from FeatureFinderAlgorithmMRM

    // TODO: check whether we can leave out some of the steps here, e.g. gaussian smoothing


    double elutionModelFit(const ConvexHull2D::PointArrayType& current_section, bool smooth_data) const

    {

      // We need at least 2 datapoints in order to create a fit

      if (current_section.size() < 2)

      {

        return -1;

      }


      // local PeakType is a small hack since here we *need* data of type

      // Peak1D, otherwise our fitter will not accept it.

      typedef Peak1D LocalPeakType;


      // -- cut line 301 of FeatureFinderAlgorithmMRM

      std::vector<LocalPeakType> data_to_fit;

      prepareFit_(current_section, data_to_fit, smooth_data);

      std::unique_ptr<InterpolationModel> model_rt;

      double quality = fitRT_(data_to_fit, model_rt);

      // cut line 354 of FeatureFinderAlgorithmMRM


      return quality;

    }


  protected:

    template<class LocalPeakType>


    double fitRT_(std::vector<LocalPeakType>& rt_input_data, std::unique_ptr<InterpolationModel>& model) const

    {

      EmgFitter1D fitter_emg1D;

      fitter_emg1D.setParameters(fitter_emg1D_params_);

      // Construct model for rt

      // NaN is checked in fit1d: if (std::isnan(quality)) quality = -1.0;

      return fitter_emg1D.fit1d(rt_input_data, model);

    }


    // Fxn from FeatureFinderAlgorithmMRM

    // TODO: check whether we can leave out some of the steps here, e.g. gaussian smoothing

    template<class LocalPeakType>


    void prepareFit_(const ConvexHull2D::PointArrayType & current_section, std::vector<LocalPeakType> & data_to_fit, bool smooth_data) const

    {

      // typedef Peak1D LocalPeakType;

      PeakSpectrum filter_spec;

      // first smooth the data to prevent outliers from destroying the fit

      for (const auto& pa : current_section)

      {

        LocalPeakType p;

        using IntensityType = typename LocalPeakType::IntensityType;

        p.setMZ(pa.getX());

        p.setIntensity(IntensityType(pa.getY()));

        filter_spec.push_back(p);

      }


      // add two peaks at the beginning and at the end for better fit

      // therefore calculate average distance first

      std::vector<double> distances;

      for (Size j = 1; j < filter_spec.size(); ++j)

      {

        distances.push_back(filter_spec[j].getMZ() - filter_spec[j - 1].getMZ());

      }

      double dist_average = std::accumulate(distances.begin(), distances.end(), 0.0) / (double) distances.size();


      // append peaks

      Peak1D new_peak;

      new_peak.setIntensity(0);

      new_peak.setMZ(filter_spec.back().getMZ() + dist_average);

      filter_spec.push_back(new_peak);

      new_peak.setMZ(filter_spec.back().getMZ() + dist_average);

      filter_spec.push_back(new_peak);

      new_peak.setMZ(filter_spec.back().getMZ() + dist_average);

      filter_spec.push_back(new_peak);


      // prepend peaks

      new_peak.setMZ(filter_spec.front().getMZ() - dist_average);

      filter_spec.insert(filter_spec.begin(), new_peak);

      new_peak.setMZ(filter_spec.front().getMZ() - dist_average);

      filter_spec.insert(filter_spec.begin(), new_peak);

      new_peak.setMZ(filter_spec.front().getMZ() - dist_average);

      filter_spec.insert(filter_spec.begin(), new_peak);


      // To get an estimate of the peak quality, we probably should not smooth

      // and/or transform the data.

      if (smooth_data)

      {

        GaussFilter filter;

        Param filter_param(filter.getParameters());

        filter.setParameters(filter_param);

        filter_param.setValue("gaussian_width", 4 * dist_average);

        filter.setParameters(filter_param);

        filter.filter(filter_spec);

      }


      // transform the data for fitting and fit RT profile

      for (Size j = 0; j != filter_spec.size(); ++j)

      {

        LocalPeakType p;

        p.setPosition(filter_spec[j].getMZ());

        p.setIntensity(filter_spec[j].getIntensity());

        data_to_fit.push_back(p);

      }

    }


    Param fitter_emg1D_params_;

  };


}


EmgFitter1D.h

EmgModel.h

GaussFilter.h

MRMFeature.h

MRMTransitionGroup.h

MSSpectrum.h

StandardTypes.h

OpenMS::ConvexHull2D::PointArrayType
std::vector< PointType > PointArrayType
Definition ConvexHull2D.h:52

OpenMS::DefaultParamHandler::getParameters
const Param & getParameters() const
Non-mutable access to the parameters.

OpenMS::DefaultParamHandler::getDefaults
const Param & getDefaults() const
Non-mutable access to the default parameters.

OpenMS::DefaultParamHandler::setParameters
void setParameters(const Param &param)
Sets the parameters.

OpenMS::EmgFitter1D
Exponentially modified gaussian distribution fitter (1-dim.) using Levenberg-Marquardt algorithm (Eig...
Definition EmgFitter1D.h:23

OpenMS::EmgFitter1D::fit1d
QualityType fit1d(const RawDataArrayType &range, std::unique_ptr< InterpolationModel > &model) override
return interpolation model

OpenMS::EmgScoring
Scoring of an elution peak using an exponentially modified gaussian distribution model.
Definition EmgScoring.h:35

OpenMS::EmgScoring::EmgScoring
EmgScoring()=default

OpenMS::EmgScoring::setFitterParam
void setFitterParam(const Param &param)
Definition EmgScoring.h:45

OpenMS::EmgScoring::elutionModelFit
double elutionModelFit(const ConvexHull2D::PointArrayType &current_section, bool smooth_data) const
Definition EmgScoring.h:82

OpenMS::EmgScoring::fitter_emg1D_params_
Param fitter_emg1D_params_
Definition EmgScoring.h:181

OpenMS::EmgScoring::getDefaults
Param getDefaults()
Get default params for the Emg1D fitting.
Definition EmgScoring.h:51

OpenMS::EmgScoring::calcElutionFitScore
double calcElutionFitScore(MRMFeature &mrmfeature, MRMTransitionGroup< SpectrumType, TransitionT > &transition_group) const
calculate the elution profile fit score
Definition EmgScoring.h:58

OpenMS::EmgScoring::fitRT_
double fitRT_(std::vector< LocalPeakType > &rt_input_data, std::unique_ptr< InterpolationModel > &model) const
Definition EmgScoring.h:106

OpenMS::EmgScoring::~EmgScoring
~EmgScoring()=default

OpenMS::EmgScoring::prepareFit_
void prepareFit_(const ConvexHull2D::PointArrayType &current_section, std::vector< LocalPeakType > &data_to_fit, bool smooth_data) const
Definition EmgScoring.h:118

OpenMS::Feature
An LC-MS feature.
Definition Feature.h:46

OpenMS::Feature::getConvexHulls
const std::vector< ConvexHull2D > & getConvexHulls() const
Non-mutable access to the convex hulls.

OpenMS::GaussFilter
This class represents a Gaussian lowpass-filter which works on uniform as well as on non-uniform prof...
Definition GaussFilter.h:47

OpenMS::GaussFilter::filter
void filter(MSSpectrum &spectrum)
Smoothes an MSSpectrum containing profile data.

OpenMS::MRMFeature
A multi-chromatogram MRM feature.
Definition MRMFeature.h:26

OpenMS::MRMFeature::getFeature
Feature & getFeature(const String &key)
get a specified feature

OpenMS::MRMTransitionGroup
The representation of a group of transitions in a targeted proteomics experiment.
Definition MRMTransitionGroup.h:42

OpenMS::MRMTransitionGroup::size
Size size() const
Definition MRMTransitionGroup.h:99

OpenMS::MRMTransitionGroup::getChromatograms
std::vector< ChromatogramType > & getChromatograms()
Definition MRMTransitionGroup.h:160

OpenMS::MSSpectrum
The representation of a 1D spectrum.
Definition MSSpectrum.h:44

OpenMS::Param
Management and storage of parameters / INI files.
Definition Param.h:46

OpenMS::Param::setValue
void setValue(const std::string &key, const ParamValue &value, const std::string &description="", const std::vector< std::string > &tags=std::vector< std::string >())
Sets a value.

OpenMS::Peak1D
A 1-dimensional raw data point or peak.
Definition Peak1D.h:30

OpenMS::Peak1D::setIntensity
void setIntensity(IntensityType intensity)
Mutable access to the data point intensity (height)
Definition Peak1D.h:86

OpenMS::Peak1D::setMZ
void setMZ(CoordinateType mz)
Mutable access to m/z.
Definition Peak1D.h:95

OpenMS::String
A more convenient string class.
Definition String.h:34

OpenMS::Size
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition Types.h:97

OPENMS_PRECONDITION
#define OPENMS_PRECONDITION(condition, message)
Precondition macro.
Definition openms/include/OpenMS/CONCEPT/Macros.h:94

OpenMS
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19