OpenMS
Loading...
Searching...
No Matches
PeptideAndProteinQuant.h
Go to the documentation of this file.
1// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin
2// SPDX-License-Identifier: BSD-3-Clause
3//
4// --------------------------------------------------------------------------
5// $Maintainer: Hendrik Weisser $
6// $Authors: Hendrik Weisser $
7// --------------------------------------------------------------------------
8
9#pragma once
10
18
19
20namespace OpenMS
21{
29 class OPENMS_DLLAPI PeptideAndProteinQuant :
31 {
32public:
33
35 typedef std::map<UInt64, double> SampleAbundances;
36
39 {
41 std::map<Int, std::map<std::string, std::map<Int, std::map<UInt, double>>>> abundances;
42
44 std::map<Int, std::map<std::string, std::map<Int, UInt64>>> psm_counts;
45
48
51
53 std::set<std::string> accessions;
54
56 Size psm_count = 0;
57
59 PeptideData() = default;
60 };
61
63 typedef std::map<AASequence, PeptideData> PeptideQuant;
64
67 {
69 std::map<std::string, SampleAbundances> peptide_abundances;
70
71 std::map<std::string, SampleAbundances> peptide_psm_counts;
72
74 std::map<std::string, std::map<UInt, double>> channel_level_abundances;
75
77 std::map<std::string, UInt64> file_level_psm_counts;
78
81
84
87
89 Size psm_count = 0;
90
92 ProteinData() = default;
93 };
94
96 typedef std::map<std::string, ProteinData> ProteinQuant;
97
100 {
103
106
109
111 Size quant_proteins, too_few_peptides;
112
114 Size quant_peptides, total_peptides;
115
117 Size quant_features, total_features, blank_features, ambig_features;
118
121 n_samples(0), quant_proteins(0), too_few_peptides(0),
122 quant_peptides(0), total_peptides(0), quant_features(0),
123 total_features(0), blank_features(0), ambig_features(0) {}
124 };
125
128
131
137 void readQuantData(FeatureMap& features, const ExperimentalDesign& ed);
138
144 void readQuantData(ConsensusMap& consensus, const ExperimentalDesign& ed);
145
151 void readQuantData(std::vector<ProteinIdentification>& proteins,
153 const ExperimentalDesign& ed);
154
166
167
176
177
178 std::map<std::string, std::string> mapAccessionToLeader(const OpenMS::ProteinIdentification& proteins) const;
179
182
185
188
191 const ProteinQuant& protein_quants,
192 ProteinIdentification& proteins,
193 bool remove_unquantified = true);
194
195private:
196
199
202
205
208
209
217
228 void quantifyFeature_(const FeatureHandle& feature,
229 size_t fraction,
230 const std::string& filename,
231 const PeptideHit& hit,
232 UInt channel_or_label);
233
242 const std::map<Int, std::map<std::string, std::map<Int, std::map<UInt, double>>>> & peptide_abundances,
243 std::tuple<size_t, std::string, size_t, UInt> & best);
244
250 template <typename T>
251 void orderBest_(const std::map<T, SampleAbundances> & abundances,
252 std::vector<T>& result)
253 {
254 typedef std::pair<Size, double> PairType;
255 std::multimap<PairType, T, std::greater<PairType> > order;
256 for (typename std::map<T, SampleAbundances>::const_iterator ab_it =
257 abundances.begin(); ab_it != abundances.end(); ++ab_it)
258 {
259 double total = 0.0;
260 for (SampleAbundances::const_iterator samp_it = ab_it->second.begin();
261 samp_it != ab_it->second.end(); ++samp_it)
262 {
263 total += samp_it->second;
264 }
265 if (total <= 0.0) continue; // not quantified
266 PairType key = std::make_pair(ab_it->second.size(), total);
267 order.insert(std::make_pair(key, ab_it->first));
268 }
269 result.clear();
270 for (typename std::multimap<PairType, T, std::greater<PairType> >::
271 iterator ord_it = order.begin(); ord_it != order.end(); ++ord_it)
272 {
273 result.push_back(ord_it->second);
274 }
275 }
276
277
278
283
292
301 std::vector<std::string> selectPeptidesForQuantification_(const std::string& protein_accession,
302 Size top_n,
303 bool fix_peptides);
304
312 double aggregateAbundances_(const std::vector<double>& abundances,
313 const std::string& method) const;
314
324 void calculateProteinAbundances_(const std::string& protein_accession,
325 const std::vector<std::string>& selected_peptides,
326 const std::string& aggregate_method,
327 Size top_n,
328 bool include_all);
329
340 void calculateFileAndChannelLevelProteinAbundances_(const std::string& protein_accession,
341 const std::vector<std::string>& selected_peptides,
342 const std::string& aggregate_method,
343 Size top_n,
344 bool include_all,
345 const std::map<std::string, std::string>& accession_to_leader);
346
353
366 std::string getAccession_(const std::set<std::string>& pep_accessions,
367 const std::map<std::string, std::string>& accession_to_leader) const;
368
375
384 size_t getSampleIDFromFilenameAndChannel_(const std::string& filename,
385 UInt channel_or_label,
386 const ExperimentalDesign& ed) const;
387
389 void updateMembers_() override;
390
391 }; // class
392
393} // namespace
A container for consensus elements.
Definition ConsensusMap.h:67
A base class for all classes handling default parameters.
Definition DefaultParamHandler.h:66
Representation of an experimental design in OpenMS. Instances can be loaded with the ExperimentalDesi...
Definition ExperimentalDesign.h:109
Representation of a Peak2D, RichPeak2D or Feature .
Definition FeatureHandle.h:36
A container for features.
Definition FeatureMap.h:78
Helper class for peptide and protein quantification based on feature data annotated with IDs.
Definition PeptideAndProteinQuant.h:31
void readQuantData(ConsensusMap &consensus, const ExperimentalDesign &ed)
Read quantitative data from a consensus map.
void annotateQuantificationsToProteins(const ProteinQuant &protein_quants, ProteinIdentification &proteins, bool remove_unquantified=true)
Annotate protein quant results as meta data to protein ids.
std::map< AASequence, PeptideData > PeptideQuant
Mapping: peptide sequence (modified) -> peptide data.
Definition PeptideAndProteinQuant.h:63
void readQuantData(FeatureMap &features, const ExperimentalDesign &ed)
Read quantitative data from a feature map.
ExperimentalDesign experimental_design_
Experimental design for filename/channel to sample mapping.
Definition PeptideAndProteinQuant.h:207
std::map< std::string, ProteinData > ProteinQuant
Mapping: protein accession -> protein data.
Definition PeptideAndProteinQuant.h:96
double aggregateAbundances_(const std::vector< double > &abundances, const std::string &method) const
Aggregate abundances using the specified mathematical method.
std::vector< std::string > selectPeptidesForQuantification_(const std::string &protein_accession, Size top_n, bool fix_peptides)
Select peptides for protein quantification based on filtering criteria.
void quantifyFeature_(const FeatureHandle &feature, size_t fraction, const std::string &filename, const PeptideHit &hit, UInt channel_or_label)
Gather quantitative information from a feature.
const PeptideQuant & getPeptideResults()
Get peptide abundance data.
void performIbaqNormalization_(const ProteinIdentification &proteins)
Perform iBAQ normalization on protein abundances.
std::map< std::string, std::string > mapAccessionToLeader(const OpenMS::ProteinIdentification &proteins) const
bool getBest_(const std::map< Int, std::map< std::string, std::map< Int, std::map< UInt, double > > > > &peptide_abundances, std::tuple< size_t, std::string, size_t, UInt > &best)
Determine fraction, filename, charge state, and channel of a peptide with the highest number of abund...
void countPeptides_(PeptideIdentificationList &peptides)
Count the number of identifications (best hits only) of each peptide sequence.
void quantifyPeptides(const PeptideIdentificationList &peptides=PeptideIdentificationList())
Compute peptide abundances.
size_t getSampleIDFromFilenameAndChannel_(const std::string &filename, UInt channel_or_label, const ExperimentalDesign &ed) const
Map (filename, channel) to sample using ExperimentalDesign.
PeptideQuant pep_quant_
Peptide quantification data.
Definition PeptideAndProteinQuant.h:201
void transferPeptideDataToProteins_(const ProteinIdentification &proteins)
Transfer peptide-level quantitative data to protein-level data structures.
~PeptideAndProteinQuant() override
Destructor.
Definition PeptideAndProteinQuant.h:130
std::string getAccession_(const std::set< std::string > &pep_accessions, const std::map< std::string, std::string > &accession_to_leader) const
Get the "canonical" protein accession from the list of protein accessions of a peptide.
void readQuantData(std::vector< ProteinIdentification > &proteins, PeptideIdentificationList &peptides, const ExperimentalDesign &ed)
Read quantitative data from identification results (for quantification via spectral counting).
void updateMembers_() override
Clear all data when parameters are set.
const ProteinQuant & getProteinResults()
Get protein abundance data.
void normalizePeptides_()
Normalize peptide abundances across samples by (multiplicative) scaling to equal medians.
void calculateFileAndChannelLevelProteinAbundances_(const std::string &protein_accession, const std::vector< std::string > &selected_peptides, const std::string &aggregate_method, Size top_n, bool include_all, const std::map< std::string, std::string > &accession_to_leader)
Calculate detailed protein abundances at channel level using selected peptides.
void quantifyProteins(const ProteinIdentification &proteins=ProteinIdentification())
Compute protein abundances.
Statistics stats_
Processing statistics for output in the end.
Definition PeptideAndProteinQuant.h:198
const Statistics & getStatistics()
Get summary statistics.
void calculateProteinAbundances_(const std::string &protein_accession, const std::vector< std::string > &selected_peptides, const std::string &aggregate_method, Size top_n, bool include_all)
Calculate protein abundances for a single protein using selected peptides.
PeptideHit getAnnotation_(PeptideIdentificationList &peptides)
Get the "canonical" annotation (a single peptide hit) of a feature/consensus feature from the associa...
void orderBest_(const std::map< T, SampleAbundances > &abundances, std::vector< T > &result)
Order keys (charges/peptides for peptide/protein quantification) according to how many samples they a...
Definition PeptideAndProteinQuant.h:251
std::map< UInt64, double > SampleAbundances
Mapping: sample ID -> abundance.
Definition PeptideAndProteinQuant.h:35
ProteinQuant prot_quant_
Protein quantification data.
Definition PeptideAndProteinQuant.h:204
PeptideAndProteinQuant()
Constructor.
Represents a single spectrum match (candidate) for a specific tandem mass spectrum (MS/MS).
Definition PeptideHit.h:52
Container for peptide identifications from multiple spectra.
Definition PeptideIdentificationList.h:66
Representation of a protein identification run.
Definition ProteinIdentification.h:55
int Int
Signed integer type.
Definition Types.h:72
unsigned int UInt
Unsigned integer type.
Definition Types.h:64
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition Types.h:97
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19
Quantitative and associated data for a peptide.
Definition PeptideAndProteinQuant.h:39
std::map< Int, std::map< std::string, std::map< Int, UInt64 > > > psm_counts
mapping: fraction -> filename -> charge -> abundance
Definition PeptideAndProteinQuant.h:44
SampleAbundances total_psm_counts
spectral counting-based abundances
Definition PeptideAndProteinQuant.h:50
SampleAbundances total_abundances
mapping: sample -> total abundance
Definition PeptideAndProteinQuant.h:47
std::map< Int, std::map< std::string, std::map< Int, std::map< UInt, double > > > > abundances
mapping: fraction -> filename -> charge -> channel/label -> abundance
Definition PeptideAndProteinQuant.h:41
std::set< std::string > accessions
protein accessions for this peptide
Definition PeptideAndProteinQuant.h:53
Quantitative and associated data for a protein.
Definition PeptideAndProteinQuant.h:67
SampleAbundances total_psm_counts
spectral counting-based abundances
Definition PeptideAndProteinQuant.h:83
std::map< std::string, SampleAbundances > peptide_psm_counts
Definition PeptideAndProteinQuant.h:71
SampleAbundances total_abundances
mapping: sample -> total abundance
Definition PeptideAndProteinQuant.h:80
std::map< std::string, std::map< UInt, double > > channel_level_abundances
mapping: filename -> channel/label -> abundance
Definition PeptideAndProteinQuant.h:74
std::map< std::string, SampleAbundances > peptide_abundances
mapping: peptide (unmodified) -> sample -> abundance
Definition PeptideAndProteinQuant.h:69
std::map< std::string, UInt64 > file_level_psm_counts
mapping: filename -> PSM counts
Definition PeptideAndProteinQuant.h:77
SampleAbundances total_distinct_peptides
number of distinct peptide sequences
Definition PeptideAndProteinQuant.h:86
Statistics for processing summary.
Definition PeptideAndProteinQuant.h:100
Size quant_proteins
protein statistics
Definition PeptideAndProteinQuant.h:111
Size quant_peptides
peptide statistics
Definition PeptideAndProteinQuant.h:114
Size n_samples
number of samples (or assays in mzTab terms)
Definition PeptideAndProteinQuant.h:102
Size n_fractions
number of fractions
Definition PeptideAndProteinQuant.h:105
Statistics()
constructor
Definition PeptideAndProteinQuant.h:120
Size n_ms_files
number of MS files
Definition PeptideAndProteinQuant.h:108
Size ambig_features
Definition PeptideAndProteinQuant.h:117