9 #ifndef OPENMS_TRANSFORMATIONS_FEATUREFINDER_FEATUREFINDERIDENTIFICATIONALGORITHM_H
10 #define OPENMS_TRANSFORMATIONS_FEATUREFINDER_FEATUREFINDERIDENTIFICATIONALGORITHM_H
26 class IsotopeDistribution;
50 std::vector<PeptideIdentification> peptides,
51 const std::vector<ProteinIdentification>& proteins,
52 std::vector<PeptideIdentification> peptides_ext,
53 std::vector<ProteinIdentification> proteins_ext,
56 const String& spectra_file =
""
83 typedef std::multimap<double, PeptideIdentification*>
RTMap;
85 typedef std::map<Int, std::pair<RTMap, RTMap> >
ChargeMap;
143 } feature_filter_quality_;
152 } feature_filter_peptides_;
160 const String& seq1 = p1.
getHits()[0].getSequence().toString();
161 const String& seq2 = p2.
getHits()[0].getSequence().toString();
166 if (charge1 == charge2)
170 return charge1 < charge2;
196 double add_mass_offset_peptides_{0.0};
201 const double seed_rt_window_ = 60.0;
227 std::map<
Size, std::vector<PeptideIdentification*> >& feat_ids,
250 bool external =
false);
255 std::map<Size, double>& training_labels);
262 const double quality_cutoff);
276 template <
typename It>
277 std::vector<std::pair<It,It>>
278 chunk_(It range_from, It range_to,
const std::ptrdiff_t batch_size)
283 using std::make_pair;
285 using diff_t = std::ptrdiff_t;
288 const diff_t total {distance(range_from, range_to)};
289 const diff_t num {total / batch_size};
291 vector<pair<It,It>> chunks(num);
293 It batch_end {range_from};
296 std::generate(begin(chunks), end(chunks), [&batch_end, batch_size]()
298 It batch_start {batch_end };
300 std::advance(batch_end, batch_size);
301 return make_pair(batch_start, batch_end);
307 chunks.emplace_back(range_from, range_to);
311 chunks.back().second = range_to;
const std::vector< PeptideIdentification > & getPeptideIdentifications() const
A base class for all classes handling default parameters.
Definition: DefaultParamHandler.h:66
Definition: FeatureFinderIdentificationAlgorithm.h:32
FeatureFinderAlgorithmPickedHelperStructs::MassTraces MassTraces
Definition: FeatureFinderIdentificationAlgorithm.h:80
const PeakMap & getMSData() const
void postProcess_(FeatureMap &features, bool with_external_ids)
const PeakMap & getChromatograms() const
double rt_window_
RT window width.
Definition: FeatureFinderIdentificationAlgorithm.h:97
void getRTRegions_(ChargeMap &peptide_data, std::vector< RTRegion > &rt_regions, bool clear_IDs=true) const
get regions in which peptide eludes (ideally only one) by clustering RT elution times
void runOnCandidates(FeatureMap &features)
std::map< AASequence, ChargeMap > PeptideMap
mapping: sequence -> charge -> internal/external ID information
Definition: FeatureFinderIdentificationAlgorithm.h:87
const TargetedExperiment & getLibrary() const
void run(std::vector< PeptideIdentification > peptides, const std::vector< ProteinIdentification > &proteins, std::vector< PeptideIdentification > peptides_ext, std::vector< ProteinIdentification > proteins_ext, FeatureMap &features, const FeatureMap &seeds=FeatureMap(), const String &spectra_file="")
void createAssayLibrary_(const PeptideMap::iterator &begin, const PeptideMap::iterator &end, PeptideRefRTMap &ref_rt_map, bool clear_IDs=true)
String svm_xval_out_
Definition: FeatureFinderIdentificationAlgorithm.h:117
String elution_model_
Definition: FeatureFinderIdentificationAlgorithm.h:112
PeptideMap peptide_map_
Definition: FeatureFinderIdentificationAlgorithm.h:91
void filterFeaturesFinalizeAssay_(Feature &best_feature, double best_quality, const double quality_cutoff)
double end
Definition: FeatureFinderIdentificationAlgorithm.h:132
PeakMap & getChromatograms()
MRMFeatureFinderScoring feat_finder_
OpenSWATH feature finder.
Definition: FeatureFinderIdentificationAlgorithm.h:212
FeatureFinderIdentificationAlgorithm()
default constructor
ProgressLogger & getProgressLogger()
void filterFeatures_(FeatureMap &features, bool classified)
Size n_external_peps_
number of external peptides
Definition: FeatureFinderIdentificationAlgorithm.h:94
double signal_to_noise_
Definition: FeatureFinderIdentificationAlgorithm.h:110
void generateTransitions_(const String &peptide_id, double mz, Int charge, const IsotopeDistribution &iso_dist)
generate transitions (isotopic traces) for a peptide ion and add them to the library:
const ProgressLogger & getProgressLogger() const
TransformationDescription trafo_external_
TransformationDescription trafo_; // RT transformation (to range 0-1)
Definition: FeatureFinderIdentificationAlgorithm.h:210
bool quantify_decoys_
Definition: FeatureFinderIdentificationAlgorithm.h:195
TargetedExperiment library_
accumulated assays for peptides
Definition: FeatureFinderIdentificationAlgorithm.h:193
void annotateFeaturesFinalizeAssay_(FeatureMap &features, std::map< Size, std::vector< PeptideIdentification * > > &feat_ids, RTMap &rt_internal)
double min_peak_width_
Definition: FeatureFinderIdentificationAlgorithm.h:109
void calculateFDR_(FeatureMap &features)
void getRandomSample_(std::map< Size, double > &training_labels) const
StringList svm_predictor_names_
Definition: FeatureFinderIdentificationAlgorithm.h:116
std::vector< PeptideIdentification > unassignedIDs_
Definition: FeatureFinderIdentificationAlgorithm.h:199
void getUnbiasedSample_(const std::multimap< double, std::pair< Size, bool > > &valid_obs, std::map< Size, double > &training_labels)
void setMSData(const PeakMap &ms_data)
set the MS data used for feature detection
std::map< Int, std::pair< RTMap, RTMap > > ChargeMap
mapping: charge -> internal/external: (RT -> pointer to peptide)
Definition: FeatureFinderIdentificationAlgorithm.h:85
Size svm_n_parts_
number of partitions for SVM cross-validation
Definition: FeatureFinderIdentificationAlgorithm.h:119
Size svm_n_samples_
number of samples for SVM training
Definition: FeatureFinderIdentificationAlgorithm.h:120
Size n_internal_peps_
number of internal peptide
Definition: FeatureFinderIdentificationAlgorithm.h:93
Size addSeeds_(std::vector< PeptideIdentification > &peptides, const FeatureMap &seeds)
Size n_internal_features_
internal feature counter (for FDR calculation)
Definition: FeatureFinderIdentificationAlgorithm.h:207
ProgressLogger prog_log_
Definition: FeatureFinderIdentificationAlgorithm.h:214
PeakMap ms_data_
input LC-MS data
Definition: FeatureFinderIdentificationAlgorithm.h:191
void statistics_(const FeatureMap &features) const
some statistics on detected features
void setMSData(PeakMap &&ms_data)
Size addOffsetPeptides_(std::vector< PeptideIdentification > &peptides, double offset)
Size batch_size_
nr of peptides to use at the same time during chromatogram extraction
Definition: FeatureFinderIdentificationAlgorithm.h:96
double mz_window_
m/z window width
Definition: FeatureFinderIdentificationAlgorithm.h:98
double svm_min_prob_
Definition: FeatureFinderIdentificationAlgorithm.h:115
std::map< String, double > isotope_probs_
isotope probabilities of transitions
Definition: FeatureFinderIdentificationAlgorithm.h:211
void checkNumObservations_(Size n_pos, Size n_neg, const String ¬e="") const
double peak_width_
Definition: FeatureFinderIdentificationAlgorithm.h:108
Size n_external_features_
Definition: FeatureFinderIdentificationAlgorithm.h:208
FeatureFinderAlgorithmPickedHelperStructs::MassTrace MassTrace
Definition: FeatureFinderIdentificationAlgorithm.h:79
Size n_isotopes_
number of isotopes for peptide assay
Definition: FeatureFinderIdentificationAlgorithm.h:104
double mapping_tolerance_
RT tolerance for mapping IDs to features.
Definition: FeatureFinderIdentificationAlgorithm.h:101
std::map< String, std::pair< RTMap, RTMap > > PeptideRefRTMap
mapping: peptide ref. -> int./ext.: (RT -> pointer to peptide)
Definition: FeatureFinderIdentificationAlgorithm.h:89
Size debug_level_
Definition: FeatureFinderIdentificationAlgorithm.h:125
double rt_quantile_
Definition: FeatureFinderIdentificationAlgorithm.h:106
std::vector< std::pair< It, It > > chunk_(It range_from, It range_to, const std::ptrdiff_t batch_size)
Definition: FeatureFinderIdentificationAlgorithm.h:278
std::multiset< double > svm_probs_external_
SVM probabilities for "external" features (for FDR calculation):
Definition: FeatureFinderIdentificationAlgorithm.h:206
ChargeMap ids
internal/external peptide IDs (per charge) in this region
Definition: FeatureFinderIdentificationAlgorithm.h:133
bool mz_window_ppm_
m/z window width is given in PPM (not Da)?
Definition: FeatureFinderIdentificationAlgorithm.h:99
void updateMembers_() override
This method is used to update extra member variables at the end of the setParameters() method.
bool use_psm_cutoff_
Definition: FeatureFinderIdentificationAlgorithm.h:197
void classifyFeatures_(FeatureMap &features)
void addPeptideRT_(TargetedExperiment::Peptide &peptide, double rt) const
PeakMap chrom_data_
accumulated chromatograms (XICs)
Definition: FeatureFinderIdentificationAlgorithm.h:192
void ensureConvexHulls_(Feature &feature) const
std::multimap< double, PeptideIdentification * > RTMap
mapping: RT (not necessarily unique) -> pointer to peptide
Definition: FeatureFinderIdentificationAlgorithm.h:83
TargetedExperiment & getLibrary()
void addPeptideToMap_(PeptideIdentification &peptide, PeptideMap &peptide_map, bool external=false)
double psm_score_cutoff_
Definition: FeatureFinderIdentificationAlgorithm.h:198
void annotateFeatures_(FeatureMap &features, PeptideRefRTMap &ref_rt_map)
annotate identified features with m/z, isotope probabilities, etc.
String candidates_out_
Definition: FeatureFinderIdentificationAlgorithm.h:123
double isotope_pmin_
min. isotope probability for peptide assay
Definition: FeatureFinderIdentificationAlgorithm.h:103
double svm_quality_cutoff
Definition: FeatureFinderIdentificationAlgorithm.h:118
std::map< double, std::pair< Size, Size > > svm_probs_internal_
SVM probability -> number of pos./neg. features (for FDR calculation):
Definition: FeatureFinderIdentificationAlgorithm.h:204
region in RT in which a peptide elutes:
Definition: FeatureFinderIdentificationAlgorithm.h:131
A container for features.
Definition: FeatureMap.h:80
An LC-MS feature.
Definition: Feature.h:46
QualityType getOverallQuality() const
Non-mutable access to the overall quality.
Definition: IsotopeDistribution.h:39
The MRMFeatureFinder finds and scores peaks of transitions that co-elute.
Definition: MRMFeatureFinderScoring.h:66
In-Memory representation of a mass spectrometry run.
Definition: MSExperiment.h:46
CoordinateType getRT() const
Returns the RT coordinate (index 0)
Definition: Peak2D.h:184
Represents the peptide hits for a spectrum.
Definition: PeptideIdentification.h:39
double getRT() const
returns the RT of the MS2 spectrum where the identification occurred
const std::vector< PeptideHit > & getHits() const
returns the peptide hits as const
Base class for all classes that want to report their progress.
Definition: ProgressLogger.h:27
A more convenient string class.
Definition: String.h:34
Represents a peptide (amino acid sequence)
Definition: TargetedExperimentHelper.h:334
A description of a targeted experiment containing precursor and production ions.
Definition: TargetedExperiment.h:39
int Int
Signed integer type.
Definition: Types.h:76
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:101
std::vector< String > StringList
Vector of String.
Definition: ListUtils.h:44
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:22
Helper struct for mass traces used in FeatureFinderAlgorithmPicked.
Definition: FeatureFinderAlgorithmPickedHelperStructs.h:54
Helper struct for a collection of mass traces used in FeatureFinderAlgorithmPicked.
Definition: FeatureFinderAlgorithmPickedHelperStructs.h:85
comparison functor for features
Definition: FeatureFinderIdentificationAlgorithm.h:178
bool operator()(const Feature &f1, const Feature &f2)
Definition: FeatureFinderIdentificationAlgorithm.h:179
predicate for filtering features by assigned peptides:
Definition: FeatureFinderIdentificationAlgorithm.h:147
bool operator()(const Feature &feature)
Definition: FeatureFinderIdentificationAlgorithm.h:148
predicate for filtering features by overall quality:
Definition: FeatureFinderIdentificationAlgorithm.h:138
bool operator()(const Feature &feature)
Definition: FeatureFinderIdentificationAlgorithm.h:139
comparison functor for (unassigned) peptide IDs
Definition: FeatureFinderIdentificationAlgorithm.h:156
bool operator()(const PeptideIdentification &p1, const PeptideIdentification &p2)
Definition: FeatureFinderIdentificationAlgorithm.h:157