current_doxygen/html/ConfidenceScoring_8h_source.html

// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin

// SPDX-License-Identifier: BSD-3-Clause

//

// --------------------------------------------------------------------------

// $Maintainer: Hendrik Weisser $

// $Authors: Hannes Roest, Hendrik Weisser $

// --------------------------------------------------------------------------


#pragma once


#include <cmath> // for "exp"

#include <limits> // for "infinity"

#include <map>


#include <OpenMS/CONCEPT/ProgressLogger.h>

#include <OpenMS/CONCEPT/LogStream.h>

#include <OpenMS/KERNEL/FeatureMap.h>

#include <OpenMS/ANALYSIS/MAPMATCHING/TransformationDescription.h>

#include <OpenMS/ANALYSIS/TARGETED/TargetedExperiment.h>


#include <OpenMS/MATH/MathFunctions.h>


namespace OpenMS

{


  /**
    @brief Confidence scoring for SRM/MRM/PRM features against a targeted assay library.

    Typical use, as far as this header shows: call initialize() and
    initializeGlm() to install the configuration, then scoreMap() to score
    every feature of a FeatureMap in place.
  */
  class OPENMS_DLLAPI ConfidenceScoring :
    public ProgressLogger
  {
  public:

    /// Constructor (defined out of line; the effect of @p test_mode_ is not visible in this header)
    explicit ConfidenceScoring(bool test_mode_ = false);

    /// Destructor
    ~ConfidenceScoring() override = default;

  protected:

    /// Binomial GLM mapping (RT difference, intensity distance) to a confidence value
    struct GLM_
    {
      double intercept = 0.0; ///< GLM intercept term
      double rt_coef = 0.0;   ///< GLM coefficient applied to the squared RT difference
      double int_coef = 0.0;  ///< GLM coefficient applied to the intensity distance

      /**
        @brief Evaluate the model: logistic function of
               intercept + rt_coef * diff_rt^2 + int_coef * dist_int.

        @param diff_rt RT difference (squared internally)
        @param dist_int Intensity distance
        @return 1 / (1 + exp(-lm)), where lm is the linear predictor above
      */
      double operator()(double diff_rt, double dist_int) const
      {
        const double lm = intercept + rt_coef * diff_rt * diff_rt +
                          int_coef * dist_int;
        // qualified call: <cmath> only guarantees the std:: overloads
        return 1.0 / (1.0 + std::exp(-lm));
      }

    } glm_;

    /// Linear rescaling of RT values based on the min./max. RT of the assay library
    struct RTNorm_
    {
      double min_rt = 0.0; ///< Smallest assay RT in the library; set by scoreMap()
      double max_rt = 0.0; ///< Largest assay RT in the library; set by scoreMap()

      /**
        @brief Rescale @p rt so that min_rt maps to 0 and max_rt maps to 100.

        Values outside [min_rt, max_rt] are not clamped. If max_rt equals
        min_rt the division is by zero and the result is not finite.
      */
      double operator()(double rt) const
      {
        return (rt - min_rt) / (max_rt - min_rt) * 100;
      }

    } rt_norm_;

    /// Targeted-assay library (set by initialize())
    TargetedExperiment library_;

    /// Indexes into library_.getPeptides(); reset to 0..n-1 by scoreMap()
    IntList decoy_index_;

    /// Number of decoy assays (0 = use all unrelated assays; scoreMap() may reset it to 0)
    Size n_decoys_ = 0;

    /// Lookup: peptide reference of a transition -> indexes into library_.getTransitions()
    std::map<std::string, IntList> transition_map_;

    /// Number of transitions to consider (set by initialize(); used by code outside this header)
    Size n_transitions_ = 0;

    /// RT transformation (set by initialize(); used by code outside this header)
    TransformationDescription rt_trafo_;

    /// Random shuffler (presumably used by chooseDecoys_() - defined out of line)
    Math::RandomShuffler shuffler_;

    /// Choose decoy assays (defined out of line)
    void chooseDecoys_();

    /// Manhattan distance between @p x and @p y (defined out of line)
    double manhattanDist_(DoubleList x, DoubleList y);

    /// Retention time of an assay; scoreMap() treats a return value of -1.0 as "missing"
    double getAssayRT_(const TargetedExperiment::Peptide& assay);

    /// Score a feature (RT and intensities) against one assay (defined out of line)
    double scoreAssay_(const TargetedExperiment::Peptide& assay,
                       double feature_rt, DoubleList& feature_intensities,
                       const std::set<std::string>& transition_ids = std::set<std::string>());

    /// Score a single feature (defined out of line)
    void scoreFeature_(Feature& feature);

  public:

    /**
      @brief Install the configuration needed before scoreMap() can run.

      @param library Assay library (copied)
      @param n_decoys Number of decoy assays (0 = use all unrelated assays)
      @param n_transitions Number of transitions to consider
      @param rt_trafo RT transformation (copied)
    */
    void initialize(const TargetedExperiment& library, const Size n_decoys, const Size n_transitions, const TransformationDescription& rt_trafo)
    {
      library_ = library;
      n_decoys_ = n_decoys;
      n_transitions_ = n_transitions;
      rt_trafo_ = rt_trafo;
    }

    /// Install the three GLM coefficients used by GLM_::operator()
    void initializeGlm(double intercept, double rt_coef, double int_coef)
    {
      glm_.intercept = intercept;
      glm_.rt_coef = rt_coef;
      glm_.int_coef = int_coef;
    }

    /**
      @brief Score every feature in @p features (in place, via scoreFeature_()).

      Before scoring, the per-library lookup state is rebuilt from scratch:
      decoy_index_, transition_map_ and the RT range in rt_norm_. If the
      requested number of decoys is not smaller than the number of unrelated
      assays (library size - 1), n_decoys_ is reset to 0 ("use all").

      @param features Features to score
      @exception Exception::IllegalArgument if the library holds fewer than 2 assays
    */
    void scoreMap(FeatureMap & features)
    {
      // are there enough assays in the library?
      const Size n_assays = library_.getPeptides().size();
      if (n_assays < 2)
      {
        throw Exception::IllegalArgument(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION,
                                         "There need to be at least 2 assays in the library for ConfidenceScoring.");
      }

      // every assay except the one matching the current feature can serve as decoy
      const Size n_unrelated = n_assays - 1;
      if (n_unrelated < n_decoys_)
      {
        OPENMS_LOG_WARN << "Warning: Parameter 'decoys' (" << n_decoys_
                        << ") is higher than the number of unrelated assays in the "
                        << "library (" << n_unrelated << "). "
                        << "Using all unrelated assays as decoys." << std::endl;
      }
      if (n_unrelated <= n_decoys_) n_decoys_ = 0; // use all available assays

      decoy_index_.resize(n_assays);
      for (Size i = 0; i < n_assays; ++i) decoy_index_[i] = boost::numeric_cast<Int>(i);

      // build mapping between assays and transitions:
      OPENMS_LOG_DEBUG << "Building transition map..." << std::endl;
      // drop entries from any previous run; otherwise a repeated call would
      // append duplicate (or stale) transition indexes to each assay
      transition_map_.clear();
      const auto& transitions = library_.getTransitions();
      for (Size i = 0; i < transitions.size(); ++i)
      {
        const std::string& ref = transitions[i].getPeptideRef();
        transition_map_[ref].push_back(boost::numeric_cast<Int>(i));
      }

      // find min./max. RT in the library:
      OPENMS_LOG_DEBUG << "Determining retention time range..." << std::endl;
      rt_norm_.min_rt = std::numeric_limits<double>::infinity();
      rt_norm_.max_rt = -std::numeric_limits<double>::infinity();
      for (const TargetedExperiment::Peptide& assay : library_.getPeptides())
      {
        const double current_rt = getAssayRT_(assay);
        if (current_rt == -1.0) continue; // indicates a missing value
        rt_norm_.min_rt = std::min(rt_norm_.min_rt, current_rt);
        rt_norm_.max_rt = std::max(rt_norm_.max_rt, current_rt);
      }

      // log scoring progress:
      OPENMS_LOG_DEBUG << "Scoring features..." << std::endl;
      startProgress(0, features.size(), "scoring features");

      for (FeatureMap::Iterator feat_it = features.begin();
           feat_it != features.end(); ++feat_it)
      {
        OPENMS_LOG_DEBUG << "Feature " << feat_it - features.begin() + 1
                         << " (ID '" << feat_it->getUniqueId() << "')"<< std::endl;
        scoreFeature_(*feat_it);
        setProgress(feat_it - features.begin());
      }
      endProgress();
    }

  };


}

FeatureMap.h

LogStream.h

OPENMS_LOG_DEBUG
#define OPENMS_LOG_DEBUG
Macro for debug information - includes file and line info.
Definition LogStream.h:591

OPENMS_LOG_WARN
#define OPENMS_LOG_WARN
Macro for warnings.
Definition LogStream.h:583

MathFunctions.h

ProgressLogger.h

TargetedExperiment.h

TransformationDescription.h

OpenMS::ConfidenceScoring
Confidence scoring for SRM/MRM/PRM features against a targeted assay library.
Definition ConfidenceScoring.h:56

OpenMS::ConfidenceScoring::scoreMap
void scoreMap(FeatureMap &features)
Score every feature in features in place, writing per-feature scores and an updated overall-quality v...
Definition ConfidenceScoring.h:219

OpenMS::ConfidenceScoring::chooseDecoys_
void chooseDecoys_()
Permute decoy_index_ in place to pick a fresh random decoy sample for the next feature.

OpenMS::ConfidenceScoring::library_
TargetedExperiment library_
Targeted-assay library: one peptide per assay, each with its transitions.
Definition ConfidenceScoring.h:114

OpenMS::ConfidenceScoring::shuffler_
Math::RandomShuffler shuffler_
Random shuffler used to draw decoy samples (seed depends on test mode — see ctor)
Definition ConfidenceScoring.h:126

OpenMS::ConfidenceScoring::decoy_index_
IntList decoy_index_
Indexes into library_.getPeptides() used as decoys for the current feature.
Definition ConfidenceScoring.h:116

OpenMS::ConfidenceScoring::n_decoys_
Size n_decoys_
Number of decoy assays to sample per feature (0 = use all unrelated assays as decoys)
Definition ConfidenceScoring.h:118

OpenMS::ConfidenceScoring::getAssayRT_
double getAssayRT_(const TargetedExperiment::Peptide &assay)
Read the (single) retention time from an assay's TargetedExperiment::Peptide; the assay is required t...

OpenMS::ConfidenceScoring::~ConfidenceScoring
~ConfidenceScoring() override
Destructor.
Definition ConfidenceScoring.h:70

OpenMS::ConfidenceScoring::rt_trafo_
TransformationDescription rt_trafo_
Optional RT transformation applied to measured feature RTs before comparison with library RTs.
Definition ConfidenceScoring.h:124

OpenMS::ConfidenceScoring::scoreAssay_
double scoreAssay_(const TargetedExperiment::Peptide &assay, double feature_rt, DoubleList &feature_intensities, const std::set< std::string > &transition_ids=std::set< std::string >())
Score one feature against one candidate assay.

OpenMS::ConfidenceScoring::manhattanDist_
double manhattanDist_(DoubleList x, DoubleList y)
Manhattan (L1) distance between two equal-length vectors.

OpenMS::ConfidenceScoring::ConfidenceScoring
ConfidenceScoring(bool test_mode_=false)
Construct an empty scorer.

OpenMS::ConfidenceScoring::scoreFeature_
void scoreFeature_(Feature &feature)
Score one feature against its matching assay plus a random decoy sample; writes the per-assay scores ...

OpenMS::ConfidenceScoring::initializeGlm
void initializeGlm(double intercept, double rt_coef, double int_coef)
Install the GLM coefficients fitted externally on a training set.
Definition ConfidenceScoring.h:186

OpenMS::ConfidenceScoring::n_transitions_
Size n_transitions_
Number of top-intensity transitions to keep when computing the intensity-distance term (0 = keep all)
Definition ConfidenceScoring.h:122

OpenMS::ConfidenceScoring::transition_map_
std::map< std::string, IntList > transition_map_
Lookup assay-id -> indexes into library_.getTransitions()
Definition ConfidenceScoring.h:120

OpenMS::ConfidenceScoring::initialize
void initialize(const TargetedExperiment &library, const Size n_decoys, const Size n_transitions, const TransformationDescription &rt_trafo)
Install the configuration needed before scoreMap() can run.
Definition ConfidenceScoring.h:168

OpenMS::Exception::IllegalArgument
A method or algorithm argument contains illegal values.
Definition Exception.h:633

OpenMS::ExposedVector::size
size_t size() const noexcept
Definition ExposedVector.h:128

OpenMS::ExposedVector::begin
iterator begin() noexcept
Definition ExposedVector.h:104

OpenMS::ExposedVector::end
iterator end() noexcept
Definition ExposedVector.h:108

OpenMS::FeatureMap
A container for features.
Definition FeatureMap.h:78

OpenMS::FeatureMap::Iterator
iterator Iterator
Definition FeatureMap.h:85

OpenMS::Feature
An LC-MS feature.
Definition Feature.h:46

OpenMS::Math::RandomShuffler
Definition MathFunctions.h:478

OpenMS::ProgressLogger
Base class for all classes that want to report their progress.
Definition ProgressLogger.h:27

OpenMS::TargetedExperimentHelper::Peptide
Represents a peptide (amino acid sequence)
Definition TargetedExperimentHelper.h:335

OpenMS::TargetedExperiment
A description of a targeted experiment containing precursor and product ions.
Definition TargetedExperiment.h:40

OpenMS::TargetedExperiment::getTransitions
const std::vector< ReactionMonitoringTransition > & getTransitions() const
returns the transition list

OpenMS::TargetedExperiment::getPeptides
const std::vector< Peptide > & getPeptides() const

OpenMS::TransformationDescription
Generic description of a coordinate transformation.
Definition TransformationDescription.h:38

OpenMS::Size
size_t Size
Size type, e.g. used for variables that hold the result of size()
Definition Types.h:97

OpenMS::IntList
std::vector< Int > IntList
Vector of signed integers.
Definition TypeAliases.h:24

OpenMS::DoubleList
std::vector< double > DoubleList
Vector of double precision real types.
Definition TypeAliases.h:31

OpenMS
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19

OpenMS::ConfidenceScoring::GLM_
Binomial GLM used to map (squared-normalised-RT-diff, intensity-distance) -> [0, 1] confidence.
Definition ConfidenceScoring.h:81

OpenMS::ConfidenceScoring::GLM_::rt_coef
double rt_coef
GLM coefficient on the squared RT difference (units: 1/RT²)
Definition ConfidenceScoring.h:83

OpenMS::ConfidenceScoring::GLM_::int_coef
double int_coef
GLM coefficient on the Manhattan intensity distance.
Definition ConfidenceScoring.h:84

OpenMS::ConfidenceScoring::GLM_::operator()
double operator()(double diff_rt, double dist_int) const
Evaluate the GLM at (diff_rt, dist_int); returns a probability in [0, 1].
Definition ConfidenceScoring.h:87

OpenMS::ConfidenceScoring::GLM_::intercept
double intercept
GLM intercept term.
Definition ConfidenceScoring.h:82

OpenMS::ConfidenceScoring::RTNorm_
Map RT values into the [0, 100] interval using min/max RT of the assay library.
Definition ConfidenceScoring.h:103

OpenMS::ConfidenceScoring::RTNorm_::min_rt
double min_rt
Smallest assay RT in the library; set by scoreMap()
Definition ConfidenceScoring.h:104

OpenMS::ConfidenceScoring::RTNorm_::max_rt
double max_rt
Largest assay RT in the library; set by scoreMap()
Definition ConfidenceScoring.h:105

OpenMS::ConfidenceScoring::RTNorm_::operator()
double operator()(double rt) const
Map rt into [0, 100] using the cached min/max library RTs.
Definition ConfidenceScoring.h:108