OpenMS
Loading...
Searching...
No Matches
IDFilter.h
Go to the documentation of this file.
1// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin
2// SPDX-License-Identifier: BSD-3-Clause
3//
4// --------------------------------------------------------------------------
5// $Maintainer: Mathias Walzer $
6// $Authors: Nico Pfeifer, Mathias Walzer, Hendrik Weisser $
7// --------------------------------------------------------------------------
8
9#pragma once
10
24#include <OpenMS/config.h>
25#include <algorithm>
26#include <climits>
27#include <functional>
28#include <map>
29#include <set>
30#include <unordered_set>
31#include <vector>
32
33namespace OpenMS
34{
35 template<typename T>
37 std::is_same_v<T, PeptideIdentification> || std::is_same_v<T, ProteinIdentification>;
38
39 template<typename T>
41 std::is_same_v<T, FeatureMap> || std::is_same_v<T, ConsensusMap>;
42
44 template<typename T>
46 !std::is_same_v<T, std::vector<PeptideIdentification>> &&
47 !std::is_same_v<T, std::vector<ProteinIdentification>> &&
48 !std::is_same_v<T, PeptideIdentificationList>;
49
70 class OPENMS_DLLAPI IDFilter
71 {
72 public:
74 IDFilter() = default;
75
77 virtual ~IDFilter() = default;
78
80 typedef std::map<Int, PeptideHit*> ChargeToPepHitP;
81 typedef std::unordered_map<std::string, ChargeToPepHitP> SequenceToChargeToPepHitP;
82 typedef std::map<std::string, SequenceToChargeToPepHitP> RunToSequenceToChargeToPepHitP;
83
90
92 template<class HitType>
93 struct HasGoodScore {
94 typedef HitType argument_type; // for use as a predicate
95
96 double score;
98
99 HasGoodScore(double score_, bool higher_score_better_) : score(score_), higher_score_better(higher_score_better_)
100 {
101 }
102
103 bool operator()(const HitType& hit) const
104 {
105 if (higher_score_better)
106 {
107 return hit.getScore() >= score;
108 }
109 return hit.getScore() <= score;
110 }
111 };
112
118 template<class HitType>
120 typedef HitType argument_type; // for use as a predicate
121
124
125 HasMetaValue(const String& key_, const DataValue& value_) : key(key_), value(value_)
126 {
127 }
128
129 bool operator()(const HitType& hit) const
130 {
131 DataValue found = hit.getMetaValue(key);
132 if (found.isEmpty())
133 return false; // meta value "key" not set
134 if (value.isEmpty())
135 return true; // "key" is set, value doesn't matter
136 return found == value;
137 }
138 };
139
141 template<class HitType>
143 typedef HitType argument_type; // for use as a predicate
144
146 double value;
147
148 HasMaxMetaValue(const String& key_, const double& value_) : key(key_), value(value_)
149 {
150 }
151
152 bool operator()(const HitType& hit) const
153 {
154 DataValue found = hit.getMetaValue(key);
155 if (found.isEmpty())
156 return false; // meta value "key" not set
157 return double(found) <= value;
158 }
159 };
160
168 template<class HitType>
170 {
171 typedef HitType argument_type; // for use as a predicate
172
174 double value;
175
182 HasMinMetaValue(const String& key_, const double& value_) :
183 key(key_),
184 value(value_)
185 {
186 }
187
194 bool operator()(const HitType& hit) const
195 {
196 DataValue found = hit.getMetaValue(key);
197 if (found.isEmpty())
198 {
199 return false; // meta value "key" not set
200 }
201 return static_cast<double>(found) >= value;
202 }
203 };
204
206
221 template<class HitType>
223 {
224 typedef HitType argument_type; // for use as a predicate
225
226 struct HasMetaValue<HitType> target_decoy, is_decoy;
227
234 target_decoy("target_decoy", "decoy"),
235 is_decoy("isDecoy", "true")
236 {
237 }
238
247 bool operator()(const HitType& hit) const
248 {
249 // @TODO: this could be done slightly more efficiently by returning
250 // false if the "target_decoy" meta value is "target" or "target+decoy",
251 // without checking for an "isDecoy" meta value in that case
252 return target_decoy(hit) || is_decoy(hit);
253 }
254 };
255
264 template<class HitType, class SetType>
266 typedef HitType argument_type; // for use as a predicate
267
268 const SetType& accessions;
269
270 explicit HasMatchingAccessionImpl(const SetType& accessions_) : accessions(accessions_)
271 {
272 }
273
274 bool operator()(const PeptideHit& hit) const
275 {
276 for (const auto& acc : hit.extractProteinAccessionsSet())
277 {
278 if (accessions.count(acc) > 0)
279 return true;
280 }
281 return false;
282 }
283
284 bool operator()(const ProteinHit& hit) const
285 {
286 return accessions.count(hit.getAccession()) > 0;
287 }
288
289 bool operator()(const PeptideEvidence& evidence) const
290 {
291 return accessions.count(evidence.getProteinAccession()) > 0;
292 }
293 };
294
296 template<class HitType>
298
300 template<class HitType>
302
308 template<class HitType, class Entry>
310 typedef HitType argument_type; // for use as a predicate
311 typedef std::map<String, Entry*> ItemMap; // Store pointers to avoid copying data
313
314 GetMatchingItems(std::vector<Entry>& records)
315 {
316 for (typename std::vector<Entry>::iterator rec_it = records.begin(); rec_it != records.end(); ++rec_it)
317 {
318 items[getKey(*rec_it)] = &(*rec_it);
319 }
320 }
321
323 {
324 }
325
326 const String& getKey(const FASTAFile::FASTAEntry& entry) const
327 {
328 return entry.identifier;
329 }
330
331 bool exists(const HitType& hit) const
332 {
333 return items.count(getHitKey(hit)) > 0;
334 }
335
336 const String& getHitKey(const PeptideEvidence& p) const
337 {
338 return p.getProteinAccession();
339 }
340
341 const Entry& getValue(const PeptideEvidence& evidence) const
342 {
343 if (!exists(evidence))
344 {
345 throw Exception::InvalidParameter(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, "Accession: '" + getHitKey(evidence) + "'. peptide evidence accession not in data");
346 }
347 return *(items.find(getHitKey(evidence))->second);
348 }
349 };
350
352
353
360
362 struct HasMinPeptideLength;
363
365 struct HasMinCharge;
366
368 struct HasLowMZError;
369
375 struct HasMatchingModification;
376
382 struct HasMatchingSequence;
383
385 struct HasNoEvidence;
386
387
394 {
395 private:
399
400 public:
402 PeptideDigestionFilter(EnzymaticDigestion& digestion, Int min, Int max) : digestion_(digestion), min_cleavages_(min), max_cleavages_(max)
403 {
404 }
405
406 static inline Int disabledValue()
407 {
408 return -1;
409 }
410
413 bool operator()(PeptideHit& p) const
414 {
415 const auto& fun = [&](const Int missed_cleavages) {
416 bool max_filter = max_cleavages_ != disabledValue() ? missed_cleavages > max_cleavages_ : false;
417 bool min_filter = min_cleavages_ != disabledValue() ? missed_cleavages < min_cleavages_ : false;
418 return max_filter || min_filter;
419 };
420 return digestion_.filterByMissedCleavages(p.getSequence().toUnmodifiedString(), fun);
421 }
422
423 void filterPeptideSequences(std::vector<PeptideHit>& hits)
424 {
425 hits.erase(std::remove_if(hits.begin(), hits.end(), (*this)), hits.end());
426 }
427 };
428
429
437
438 // Build an accession index to avoid the linear search cost
443
444 DigestionFilter(std::vector<FASTAFile::FASTAEntry>& entries, ProteaseDigestion& digestion, bool ignore_missed_cleavages, bool methionine_cleavage) :
445 accession_resolver_(entries), digestion_(digestion), ignore_missed_cleavages_(ignore_missed_cleavages), methionine_cleavage_(methionine_cleavage)
446 {
447 }
448
449 bool operator()(const PeptideEvidence& evidence) const
450 {
451 if (!evidence.hasValidLimits())
452 {
453 OPENMS_LOG_WARN << "Invalid limits! Peptide '" << evidence.getProteinAccession() << "' not filtered" << std::endl;
454 return true;
455 }
456
457 if (accession_resolver_.exists(evidence))
458 {
459 return digestion_.isValidProduct(AASequence::fromString(accession_resolver_.getValue(evidence).sequence), evidence.getStart(), evidence.getEnd() - evidence.getStart(),
460 ignore_missed_cleavages_, methionine_cleavage_);
461 }
462 else
463 {
464 if (evidence.getProteinAccession().empty())
465 {
466 OPENMS_LOG_WARN << "Peptide accession not available! Skipping Evidence." << std::endl;
467 }
468 else
469 {
470 OPENMS_LOG_WARN << "Peptide accession '" << evidence.getProteinAccession() << "' not found in fasta file!" << std::endl;
471 }
472 return true;
473 }
474 }
475
477 {
478 IDFilter::FilterPeptideEvidences<IDFilter::DigestionFilter>(*this, peptides);
479 }
480 };
481
483
484
487
489 template<class IdentificationType>
490 struct HasNoHits {
491 typedef IdentificationType argument_type; // for use as a predicate
492
493 bool operator()(const IdentificationType& id) const
494 {
495 return id.getHits().empty();
496 }
497 };
498
500
501
504
506 struct HasRTInRange;
507
509 struct HasMZInRange;
510
512
513
520
522 template<class Container, class Predicate>
523 static void removeMatchingItems(Container& items, const Predicate& pred)
524 {
525 items.erase(std::remove_if(items.begin(), items.end(), pred), items.end());
526 }
527
529 template<class Container, class Predicate>
530 static void keepMatchingItems(Container& items, const Predicate& pred)
531 {
532 items.erase(std::remove_if(items.begin(), items.end(), std::not_fn(pred)), items.end());
533 }
534
536 template<class Container, class Predicate>
537 static void moveMatchingItems(Container& items, const Predicate& pred, Container& target)
538 {
539 auto part = std::partition(items.begin(), items.end(), std::not_fn(pred));
540 std::move(part, items.end(), std::back_inserter(target));
541 items.erase(part, items.end());
542 }
543
545 template<class IDContainer, class Predicate>
546 static void removeMatchingItemsUnroll(IDContainer& items, const Predicate& pred)
547 {
548 for (auto& item : items)
549 {
550 removeMatchingItems(item.getHits(), pred);
551 }
552 }
553
555 template<class IDContainer, class Predicate>
556 static void keepMatchingItemsUnroll(IDContainer& items, const Predicate& pred)
557 {
558 for (auto& item : items)
559 {
560 keepMatchingItems(item.getHits(), pred);
561 }
562 }
563
564 template<class MapType, class Predicate>
565 static void keepMatchingPeptideHits(MapType& prot_and_pep_ids, Predicate& pred)
566 {
567 for (auto& feat : prot_and_pep_ids)
568 {
569 keepMatchingItemsUnroll(feat.getPeptideIdentifications(), pred);
570 }
571 keepMatchingItemsUnroll(prot_and_pep_ids.getUnassignedPeptideIdentifications(), pred);
572 }
573
574 template<class MapType, class Predicate>
575 static void removeMatchingPeptideHits(MapType& prot_and_pep_ids, Predicate& pred)
576 {
577 for (auto& feat : prot_and_pep_ids)
578 {
579 removeMatchingItemsUnroll(feat.getPeptideIdentifications(), pred);
580 }
581 removeMatchingItemsUnroll(prot_and_pep_ids.getUnassignedPeptideIdentifications(), pred);
582 }
583
584 template<IsFeatureOrConsensusMap MapType, class Predicate>
585 static void removeMatchingPeptideIdentifications(MapType& prot_and_pep_ids, Predicate& pred)
586 {
587 for (auto& feat : prot_and_pep_ids)
588 {
589 removeMatchingItems(feat.getPeptideIdentifications(), pred);
590 }
591 removeMatchingItems(prot_and_pep_ids.getUnassignedPeptideIdentifications(), pred);
592 }
593
594 // Specialization for PeptideIdentificationList
595 template<class Predicate>
597 {
598 removeMatchingItems(pep_ids, pred);
599 }
600
602
603
606
608 template<class IdentificationType>
609 static Size countHits(const std::vector<IdentificationType>& ids)
610 {
611 Size counter = 0;
612 for (typename std::vector<IdentificationType>::const_iterator id_it = ids.begin(); id_it != ids.end(); ++id_it)
613 {
614 counter += id_it->getHits().size();
615 }
616 return counter;
617 }
618
621 {
622 Size counter = 0;
623 for (const auto& id : ids)
624 {
625 counter += id.getHits().size();
626 }
627 return counter;
628 }
629
631 static void filterHitsByRank(PeptideIdentificationList& ids, Size min_rank, Size max_rank)
632 {
633 std::vector<PeptideIdentification>& vec = ids.getData();
634 filterHitsByRank(vec, min_rank, max_rank);
635 }
636
638 static void removeHitsMatchingProteins(PeptideIdentificationList& ids, const std::set<String>& accessions)
639 {
640 std::vector<PeptideIdentification>& vec = ids.getData();
641 removeHitsMatchingProteins(vec, accessions);
642 }
643
645 static void keepHitsMatchingProteins(PeptideIdentificationList& ids, const std::set<String>& accessions)
646 {
647 std::vector<PeptideIdentification>& vec = ids.getData();
648 keepHitsMatchingProteins(vec, accessions);
649 }
650
652 static bool getBestHit(PeptideIdentificationList& ids, bool assume_sorted, PeptideHit& best_hit)
653 {
654 std::vector<PeptideIdentification>& vec = ids.getData();
655 return getBestHit(vec, assume_sorted, best_hit);
656 }
657
660 {
661 std::vector<PeptideIdentification>& vec = ids.getData();
662 removeEmptyIdentifications(vec);
663 }
664
678 template<class IdentificationType>
679 static bool getBestHit(const std::vector<IdentificationType>& identifications, bool assume_sorted, typename IdentificationType::HitType& best_hit)
680 {
681 if (identifications.empty())
682 return false;
683
684 typename std::vector<IdentificationType>::const_iterator best_id_it = identifications.end();
685 typename std::vector<typename IdentificationType::HitType>::const_iterator best_hit_it;
686
687 for (typename std::vector<IdentificationType>::const_iterator id_it = identifications.begin(); id_it != identifications.end(); ++id_it)
688 {
689 if (id_it->getHits().empty())
690 continue;
691
692 if (best_id_it == identifications.end()) // no previous "best" hit
693 {
694 best_id_it = id_it;
695 best_hit_it = id_it->getHits().begin();
696 }
697 else if (best_id_it->getScoreType() != id_it->getScoreType())
698 {
699 throw Exception::InvalidValue(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, "Can't compare scores of different types", best_id_it->getScoreType() + "/" + id_it->getScoreType());
700 }
701
702 bool higher_better = best_id_it->isHigherScoreBetter();
703 for (typename std::vector<typename IdentificationType::HitType>::const_iterator hit_it = id_it->getHits().begin(); hit_it != id_it->getHits().end(); ++hit_it)
704 {
705 if ((higher_better && (hit_it->getScore() > best_hit_it->getScore())) || (!higher_better && (hit_it->getScore() < best_hit_it->getScore())))
706 {
707 best_hit_it = hit_it;
708 }
709 if (assume_sorted)
710 break; // only consider the first hit
711 }
712 }
713
714 if (best_id_it == identifications.end())
715 {
716 return false; // no hits in any IDs
717 }
718
719 best_hit = *best_hit_it;
720 return true;
721 }
722
730 static void extractPeptideSequences(const PeptideIdentificationList& peptides, std::set<String>& sequences, bool ignore_mods = false);
731
737 static std::map<String, std::vector<ProteinHit>> extractUnassignedProteins(ConsensusMap& cmap);
738
744 template<class EvidenceFilter>
745 static void FilterPeptideEvidences(EvidenceFilter& filter, PeptideIdentificationList& peptides)
746 {
747 for (PeptideIdentificationList::iterator pep_it = peptides.begin(); pep_it != peptides.end(); ++pep_it)
748 {
749 for (std::vector<PeptideHit>::iterator hit_it = pep_it->getHits().begin(); hit_it != pep_it->getHits().end(); ++hit_it)
750 {
751 std::vector<PeptideEvidence> evidences;
752 remove_copy_if(hit_it->getPeptideEvidences().begin(), hit_it->getPeptideEvidences().end(), back_inserter(evidences), std::not_fn(filter));
753 hit_it->setPeptideEvidences(evidences);
754 }
755 }
756 }
757
759
760
765 static void removeUnreferencedProteins(ConsensusMap& cmap, bool include_unassigned);
766
768 static void removeUnreferencedProteins(std::vector<ProteinIdentification>& proteins, const PeptideIdentificationList& peptides);
771
787 static void removeDanglingProteinReferences(PeptideIdentificationList& peptides, const std::vector<ProteinIdentification>& proteins, bool remove_peptides_without_reference = false);
788
803 static void removeDanglingProteinReferences(ConsensusMap& cmap, bool remove_peptides_without_reference = false);
804
819 static void removeDanglingProteinReferences(ConsensusMap& cmap, const ProteinIdentification& ref_run, bool remove_peptides_without_reference = false);
820
829 static bool updateProteinGroups(std::vector<ProteinIdentification::ProteinGroup>& groups, const std::vector<ProteinHit>& hits);
830
837 static void removeUngroupedProteins(const std::vector<ProteinIdentification::ProteinGroup>& groups, std::vector<ProteinHit>& hits);
839
840
843
845 template<IsPeptideOrProteinIdentification IdentificationType>
846 static void removeEmptyIdentifications(std::vector<IdentificationType>& ids)
847 {
848 struct HasNoHits<IdentificationType> empty_filter;
849 removeMatchingItems(ids, empty_filter);
850 }
851
857 template<class IdentificationType>
858 static void filterHitsByScore(std::vector<IdentificationType>& ids, double threshold_score)
859 {
860 for (typename std::vector<IdentificationType>::iterator id_it = ids.begin(); id_it != ids.end(); ++id_it)
861 {
862 struct HasGoodScore<typename IdentificationType::HitType> score_filter(threshold_score, id_it->isHigherScoreBetter());
863 keepMatchingItems(id_it->getHits(), score_filter);
864 }
865 }
866
880 template<class IdentificationType>
881 static void filterHitsByScore(std::vector<IdentificationType>& ids, double threshold_score, IDScoreSwitcherAlgorithm::ScoreType score_type)
882 {
884 bool at_least_one_found = false;
885 for (IdentificationType& id : ids)
886 {
887 if (switcher.isScoreType(id.getScoreType(), score_type))
888 {
889 struct HasGoodScore<typename IdentificationType::HitType> score_filter(threshold_score, id.isHigherScoreBetter());
890 keepMatchingItems(id.getHits(), score_filter);
891 }
892 else
893 {
894 // If one assumes they are all the same in the vector, this could be done in the beginning.
895 auto result = switcher.findScoreType<IdentificationType>(id, score_type);
896 if (!result.score_name.empty())
897 {
898 String metaval = result.score_name;
899 if (switcher.isScoreTypeHigherBetter(score_type))
900 {
901 struct HasMinMetaValue<typename IdentificationType::HitType> score_filter(metaval, threshold_score);
902 keepMatchingItems(id.getHits(), score_filter);
903 }
904 else
905 {
906 struct HasMaxMetaValue<typename IdentificationType::HitType> score_filter(metaval, threshold_score);
907 keepMatchingItems(id.getHits(), score_filter);
908 }
909 at_least_one_found = true;
910 }
911 }
912 }
913 if (!at_least_one_found) OPENMS_LOG_WARN << String("Warning: No hit with the given score_type found. All hits removed.") << std::endl;
914 }
915
922 static void filterGroupsByScore(std::vector<ProteinIdentification::ProteinGroup>& grps, double threshold_score, bool higher_better);
923
929 template<class IdentificationType>
930 static void filterHitsByScore(IdentificationType& id, double threshold_score)
931 {
932 struct HasGoodScore<typename IdentificationType::HitType> score_filter(threshold_score, id.isHigherScoreBetter());
933 keepMatchingItems(id.getHits(), score_filter);
934 }
935
941 template<class IdentificationType>
942 static void keepNBestHits(std::vector<IdentificationType>& ids, Size n)
943 {
944 for (typename std::vector<IdentificationType>::iterator id_it = ids.begin(); id_it != ids.end(); ++id_it)
945 {
946 id_it->sort();
947 if (n < id_it->getHits().size())
948 id_it->getHits().resize(n);
949 }
950 }
951
960 static void keepNBestHits(PeptideIdentificationList& pep_ids, Size n)
961 {
962 std::vector<PeptideIdentification>& vec = pep_ids.getData();
963 keepNBestHits(vec, n);
964 }
965
980 template<class IdentificationType>
981 static void filterHitsByRank(std::vector<IdentificationType>& ids, Size min_rank, Size max_rank)
982 {
983 for (auto& id : ids)
984 {
985 auto& hits = id.getHits();
986 if (hits.empty()) continue;
987
988 id.sort(); // Ensure hits are properly sorted
989
990 // ignore max_rank?
991 if (max_rank < min_rank) max_rank = hits.size();
992
993 Size rank = 1;
994 double last_score = hits.front().getScore();
995
996 // Remove hits not within [min_rank, max_rank], while computing rank on the fly
997 hits.erase(
998 std::remove_if(hits.begin(), hits.end(),
999 [&](const auto& hit) {
1000 if (hit.getScore() != last_score)
1001 {
1002 ++rank;
1003 last_score = hit.getScore();
1004 }
1005 return rank < min_rank || rank > max_rank;
1006 }),
1007 hits.end()
1008 );
1009 }
1010 }
1011
1019 template<class IdentificationType>
1020 static void removeDecoyHits(std::vector<IdentificationType>& ids)
1021 {
1022 struct HasDecoyAnnotation<typename IdentificationType::HitType> decoy_filter;
1023 for (typename std::vector<IdentificationType>::iterator id_it = ids.begin(); id_it != ids.end(); ++id_it)
1024 {
1025 removeMatchingItems(id_it->getHits(), decoy_filter);
1026 }
1027 }
1028
1036 template<class IdentificationType>
1037 static void removeHitsMatchingProteins(std::vector<IdentificationType>& ids, const std::set<String> accessions)
1038 {
1039 HasMatchingAccession<typename IdentificationType::HitType> acc_filter(accessions);
1040 for (auto& id_it : ids)
1041 {
1042 removeMatchingItems(id_it.getHits(), acc_filter);
1043 }
1044 }
1045
1053 template<IsPeptideOrProteinIdentification IdentificationType>
1054 static void keepHitsMatchingProteins(IdentificationType& id, const std::set<String>& accessions)
1055 {
1056 HasMatchingAccession<typename IdentificationType::HitType> acc_filter(accessions);
1057 keepMatchingItems(id.getHits(), acc_filter);
1058 }
1059
1067 template<class IdentificationType>
1068 static void keepHitsMatchingProteins(std::vector<IdentificationType>& ids, const std::set<String>& accessions)
1069 {
1070 for (auto& id_it : ids) keepHitsMatchingProteins(id_it, accessions);
1071 }
1072
1074
1075
1078
1085 static void keepBestPeptideHits(PeptideIdentificationList& peptides, bool strict = false);
1086
1095 static void filterPeptidesByLength(PeptideIdentificationList& peptides, Size min_length, Size max_length = UINT_MAX);
1096
1105 static void filterPeptidesByCharge(PeptideIdentificationList& peptides, Int min_charge, Int max_charge);
1106
1108 static void filterPeptidesByRT(PeptideIdentificationList& peptides, double min_rt, double max_rt);
1109
1111 static void filterPeptidesByMZ(PeptideIdentificationList& peptides, double min_mz, double max_mz);
1112
1124 static void filterPeptidesByMZError(PeptideIdentificationList& peptides, double mass_error, bool unit_ppm);
1125
1126
1133 template<class Filter>
1134 static void filterPeptideEvidences(Filter& filter, PeptideIdentificationList& peptides);
1135
1147 static void filterPeptidesByRTPredictPValue(PeptideIdentificationList& peptides, const String& metavalue_key, double threshold = 0.05);
1148
1150 static void removePeptidesWithMatchingModifications(PeptideIdentificationList& peptides, const std::set<String>& modifications);
1151
1152 static void removePeptidesWithMatchingRegEx(PeptideIdentificationList& peptides, const String& regex);
1153
1155 static void keepPeptidesWithMatchingModifications(PeptideIdentificationList& peptides, const std::set<String>& modifications);
1156
1164 static void removePeptidesWithMatchingSequences(PeptideIdentificationList& peptides, const PeptideIdentificationList& bad_peptides, bool ignore_mods = false);
1165
1173 static void keepPeptidesWithMatchingSequences(PeptideIdentificationList& peptides, const PeptideIdentificationList& good_peptides, bool ignore_mods = false);
1174
1176 static void keepUniquePeptidesPerProtein(PeptideIdentificationList& peptides);
1177
1184 static void removeDuplicatePeptideHits(PeptideIdentificationList& peptides, bool seq_only = false);
1185
1187
1188
1191
1193 static void filterHitsByScore(AnnotatedMSRun& annotated_data,
1194 double peptide_threshold_score,
1195 double protein_threshold_score)
1196 {
1197 // filter protein hits:
1198 filterHitsByScore(annotated_data.getProteinIdentifications(),
1199 protein_threshold_score);
1200 // don't remove empty protein IDs - they contain search meta data and may
1201 // be referenced by peptide IDs (via run ID)
1202
1203 // filter peptide hits:
1204 for (PeptideIdentification& peptide_id : annotated_data.getPeptideIdentifications())
1205 {
1206 filterHitsByScore(peptide_id, peptide_threshold_score);
1207 }
1208 removeDanglingProteinReferences(annotated_data.getPeptideIdentifications(), annotated_data.getProteinIdentifications());
1209 }
1210
1212 static void keepNBestHits(AnnotatedMSRun& annotated_data, Size n)
1213 {
1214 // don't filter the protein hits by "N best" here - filter the peptides
1215 // and update the protein hits!
1216 PeptideIdentificationList all_peptides; // IDs from all spectra
1217 // filter peptide hits:
1218 for (PeptideIdentification& peptide_id : annotated_data.getPeptideIdentifications())
1219 {
1220 // Create a temporary vector with a single PeptideIdentification
1221 PeptideIdentificationList temp_vec = {peptide_id};
1222 keepNBestHits(temp_vec, n);
1223 // Copy back the filtered hits
1224 if (!temp_vec.empty())
1225 {
1226 peptide_id = temp_vec[0];
1227 }
1228 else
1229 {
1230 peptide_id.getHits().clear();
1231 }
1232
1233 // Since we're working with individual PeptideIdentifications, we don't need to remove empty ones
1234 // but we still need to update protein references
1235 temp_vec = {peptide_id};
1236 removeDanglingProteinReferences(temp_vec, annotated_data.getProteinIdentifications());
1237 all_peptides.push_back(peptide_id);
1238 }
1239 // update protein hits:
1240 removeUnreferencedProteins(annotated_data.getProteinIdentifications(), all_peptides);
1241 }
1242
1245 static void keepNBestSpectra(PeptideIdentificationList& peptides, Size n);
1246
1248 template<class MapType>
1249 static void keepNBestPeptideHits(MapType& map, Size n)
1250 {
1251 // The rank predicate needs annotated ranks, not sure if they are always updated. Use the following instead,
1252 // which sorts Hits first.
1253 for (auto& feat : map)
1254 {
1255 keepNBestHits(feat.getPeptideIdentifications(), n);
1256 }
1257 keepNBestHits(map.getUnassignedPeptideIdentifications(), n);
1258 }
1259
1260 template<IsNotIdentificationVector MapType>
1261 static void removeEmptyIdentifications(MapType& prot_and_pep_ids)
1262 {
1263 const auto pred = HasNoHits<PeptideIdentification>();
1264 removeMatchingPeptideIdentifications(prot_and_pep_ids, pred);
1265 }
1266
1268 static void keepBestPerPeptide(PeptideIdentificationList& pep_ids, bool ignore_mods, bool ignore_charges, Size nr_best_spectrum)
1269 {
1270 annotateBestPerPeptide(pep_ids, ignore_mods, ignore_charges, nr_best_spectrum);
1271 HasMetaValue<PeptideHit> best_per_peptide {"best_per_peptide", 1};
1272 keepMatchingItemsUnroll(pep_ids, best_per_peptide);
1273 }
1274
1275 static void keepBestPerPeptidePerRun(std::vector<ProteinIdentification>& prot_ids, PeptideIdentificationList& pep_ids, bool ignore_mods, bool ignore_charges, Size nr_best_spectrum)
1276 {
1277 annotateBestPerPeptidePerRun(prot_ids, pep_ids, ignore_mods, ignore_charges, nr_best_spectrum);
1278 HasMetaValue<PeptideHit> best_per_peptide {"best_per_peptide", 1};
1279 keepMatchingItemsUnroll(pep_ids, best_per_peptide);
1280 }
1281
1282 // TODO allow skipping unassigned?
1283 template<class MapType>
1284 static void annotateBestPerPeptidePerRun(MapType& prot_and_pep_ids, bool ignore_mods, bool ignore_charges, Size nr_best_spectrum)
1285 {
1286 const auto& prot_ids = prot_and_pep_ids.getProteinIdentifications();
1287
1288 RunToSequenceToChargeToPepHitP best_peps_per_run;
1289 for (const auto& idrun : prot_ids)
1290 {
1291 best_peps_per_run[idrun.getIdentifier()] = SequenceToChargeToPepHitP();
1292 }
1293
1294 for (auto& feat : prot_and_pep_ids)
1295 {
1296 annotateBestPerPeptidePerRunWithData(best_peps_per_run, feat.getPeptideIdentifications(), ignore_mods, ignore_charges, nr_best_spectrum);
1297 }
1298
1299 annotateBestPerPeptidePerRunWithData(best_peps_per_run, prot_and_pep_ids.getUnassignedPeptideIdentifications(), ignore_mods, ignore_charges, nr_best_spectrum);
1300 }
1301
1302 template<class MapType>
1303 static void keepBestPerPeptidePerRun(MapType& prot_and_pep_ids, bool ignore_mods, bool ignore_charges, Size nr_best_spectrum)
1304 {
1305 annotateBestPerPeptidePerRun(prot_and_pep_ids, ignore_mods, ignore_charges, nr_best_spectrum);
1306 HasMetaValue<PeptideHit> best_per_peptide {"best_per_peptide", 1};
1307 keepMatchingPeptideHits(prot_and_pep_ids, best_per_peptide);
1308 }
1309
1312 static void annotateBestPerPeptidePerRun(const std::vector<ProteinIdentification>& prot_ids, PeptideIdentificationList& pep_ids, bool ignore_mods, bool ignore_charges,
1313 Size nr_best_spectrum)
1314 {
1315 RunToSequenceToChargeToPepHitP best_peps_per_run;
1316 for (const auto& id : prot_ids)
1317 {
1318 best_peps_per_run[id.getIdentifier()] = SequenceToChargeToPepHitP();
1319 }
1320 annotateBestPerPeptidePerRunWithData(best_peps_per_run, pep_ids, ignore_mods, ignore_charges, nr_best_spectrum);
1321 }
1322
1326 static void annotateBestPerPeptidePerRunWithData(RunToSequenceToChargeToPepHitP& best_peps_per_run, PeptideIdentificationList& pep_ids, bool ignore_mods, bool ignore_charges,
1327 Size nr_best_spectrum)
1328 {
1329 for (auto& pep : pep_ids)
1330 {
1331 SequenceToChargeToPepHitP& best_pep = best_peps_per_run[pep.getIdentifier()];
1332 annotateBestPerPeptideWithData(best_pep, pep, ignore_mods, ignore_charges, nr_best_spectrum);
1333 }
1334 }
1335
1339 static void annotateBestPerPeptide(PeptideIdentificationList& pep_ids, bool ignore_mods, bool ignore_charges, Size nr_best_spectrum)
1340 {
1341 SequenceToChargeToPepHitP best_pep;
1342 for (auto& pep : pep_ids)
1343 {
1344 annotateBestPerPeptideWithData(best_pep, pep, ignore_mods, ignore_charges, nr_best_spectrum);
1345 }
1346 }
1347
1352 static void annotateBestPerPeptideWithData(SequenceToChargeToPepHitP& best_pep, PeptideIdentification& pep, bool ignore_mods, bool ignore_charges, Size nr_best_spectrum)
1353 {
1354 bool higher_score_better = pep.isHigherScoreBetter();
1355 // make sure that first = best hit
1356 pep.sort();
1357
1358 auto pepIt = pep.getHits().begin();
1359 auto pepItEnd = nr_best_spectrum == 0 || pep.getHits().size() <= nr_best_spectrum ? pep.getHits().end() : pep.getHits().begin() + nr_best_spectrum;
1360 for (; pepIt != pepItEnd; ++pepIt)
1361 {
1362 PeptideHit& hit = *pepIt;
1363
1364 String lookup_seq;
1365 if (ignore_mods)
1366 {
1367 lookup_seq = hit.getSequence().toUnmodifiedString();
1368 }
1369 else
1370 {
1371 lookup_seq = hit.getSequence().toString();
1372 }
1373
1374 int lookup_charge = 0;
1375 if (!ignore_charges)
1376 {
1377 lookup_charge = hit.getCharge();
1378 }
1379
1380 // try to insert
1381 auto it_inserted = best_pep.emplace(std::move(lookup_seq), ChargeToPepHitP());
1382 auto it_inserted_chg = it_inserted.first->second.emplace(lookup_charge, &hit);
1383
1384 PeptideHit*& p = it_inserted_chg.first->second; // now this gets either the old one if already present, or this
1385 if (!it_inserted_chg.second) // was already present -> possibly update
1386 {
1387 if ((higher_score_better && (hit.getScore() > p->getScore())) || (!higher_score_better && (hit.getScore() < p->getScore())))
1388 {
1389 p->setMetaValue("best_per_peptide", 0);
1390 hit.setMetaValue("best_per_peptide", 1);
1391 p = &hit;
1392 }
1393 else // note that this was def. not the best
1394 {
1395 // TODO if it is only about filtering, we can omit writing this metavalue (absence = false)
1396 hit.setMetaValue("best_per_peptide", 0);
1397 }
1398 }
1399 else // newly inserted -> first for that sequence (and optionally charge)
1400 {
1401 hit.setMetaValue("best_per_peptide", 1);
1402 }
1403 }
1404 }
1405
1408 AnnotatedMSRun& experiment,
1409 const std::vector<FASTAFile::FASTAEntry>& proteins)
1410 {
1411 std::set<String> accessions;
1412 for (auto it = proteins.begin(); it != proteins.end(); ++it)
1413 {
1414 accessions.insert(it->identifier);
1415 }
1416
1417 // filter protein hits:
1418 keepHitsMatchingProteins(experiment.getProteinIdentifications(), accessions);
1419
1420 // filter peptide hits:
1421 // std::pair<OpenMS::MSSpectrum&, OpenMS::PeptideIdentification&>
1422 for (auto [spectrum, peptide_id] : experiment)
1423 {
1424 if (spectrum.getMSLevel() == 2)
1425 {
1426 keepHitsMatchingProteins(peptide_id, accessions);
1427 }
1428 }
1429 removeEmptyIdentifications(experiment.getPeptideIdentifications());
1430 }
1431
1433
1434
1437
1448
1461
1467 static void removeDecoys(IdentificationData& id_data);
1469
1470 // Specific overloads for PeptideIdentificationList to ensure correct template resolution
1472 {
1473 removeDecoyHits(ids.getData());
1474 }
1475
1476 static void filterHitsByScore(PeptideIdentificationList& ids, double threshold_score)
1477 {
1478 filterHitsByScore(ids.getData(), threshold_score);
1479 }
1480
1481 static void removeUnreferencedProteins(std::vector<ProteinIdentification>& proteins, PeptideIdentificationList& ids)
1482 {
1483 removeUnreferencedProteins(proteins, ids.getData());
1484 }
1485 };
1486
1487} // namespace OpenMS
#define OPENMS_LOG_WARN
Macro for warnings.
Definition LogStream.h:550
String toUnmodifiedString() const
returns the peptide as string without any modifications or (e.g., "PEPTIDER")
Class for storing MS run data with peptide and protein identifications.
Definition AnnotatedMSRun.h:38
PeptideIdentificationList & getPeptideIdentifications()
Get all peptide identifications for all spectra.
std::vector< ProteinIdentification > & getProteinIdentifications()
Get the protein identification.
Definition AnnotatedMSRun.h:85
A container for consensus elements.
Definition ConsensusMap.h:68
Class to hold strings, numeric values, lists of strings and lists of numeric values.
Definition DataValue.h:34
bool isEmpty() const
Test if the value is empty.
Class for the enzymatic digestion of sequences.
Definition EnzymaticDigestion.h:38
bool filterByMissedCleavages(const String &sequence, const std::function< bool(const Int)> &filter) const
Filter based on the number of missed cleavages.
Exception indicating that an invalid parameter was handed over to an algorithm.
Definition Exception.h:317
Invalid value exception.
Definition Exception.h:306
const VecMember & getData() const
read-only access to the underlying data
Definition ExposedVector.h:328
typename VecMember::iterator iterator
Definition ExposedVector.h:68
iterator begin() noexcept
Definition ExposedVector.h:104
iterator end() noexcept
Definition ExposedVector.h:108
Filter Peptide Hit by its digestion product.
Definition IDFilter.h:394
Int max_cleavages_
Definition IDFilter.h:398
EnzymaticDigestion & digestion_
Definition IDFilter.h:396
PeptideHit argument_type
Definition IDFilter.h:401
Int min_cleavages_
Definition IDFilter.h:397
bool operator()(PeptideHit &p) const
Definition IDFilter.h:413
void filterPeptideSequences(std::vector< PeptideHit > &hits)
Definition IDFilter.h:423
PeptideDigestionFilter(EnzymaticDigestion &digestion, Int min, Int max)
Definition IDFilter.h:402
static Int disabledValue()
Definition IDFilter.h:406
Collection of functions for filtering peptide and protein identifications.
Definition IDFilter.h:71
static void removeHitsMatchingProteins(PeptideIdentificationList &ids, const std::set< String > &accessions)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition IDFilter.h:638
static void filterHitsByScore(std::vector< IdentificationType > &ids, double threshold_score)
Filters peptide or protein identifications according to the score of the hits.
Definition IDFilter.h:858
static void removeUnreferencedProteins(std::vector< ProteinIdentification > &proteins, const PeptideIdentificationList &peptides)
Removes protein hits from proteins that are not referenced by a peptide in peptides.
static void removeDanglingProteinReferences(ConsensusMap &cmap, const ProteinIdentification &ref_run, bool remove_peptides_without_reference=false)
Removes dangling protein references from peptide hits using a reference protein run.
static void moveMatchingItems(Container &items, const Predicate &pred, Container &target)
Move items that satisfy a condition to a container (e.g. vector)
Definition IDFilter.h:537
static void keepBestMatchPerObservation(IdentificationData &id_data, IdentificationData::ScoreTypeRef score_ref)
Filter IdentificationData to keep only the best match (e.g. PSM) for each observation (e....
std::map< std::string, SequenceToChargeToPepHitP > RunToSequenceToChargeToPepHitP
Definition IDFilter.h:82
static void keepMatchingPeptideHits(MapType &prot_and_pep_ids, Predicate &pred)
Definition IDFilter.h:565
static void removeMatchingItems(Container &items, const Predicate &pred)
Remove items that satisfy a condition from a container (e.g. vector)
Definition IDFilter.h:523
std::unordered_map< std::string, ChargeToPepHitP > SequenceToChargeToPepHitP
Definition IDFilter.h:81
static void removeDecoyHits(PeptideIdentificationList &ids)
Definition IDFilter.h:1471
static void removeEmptyIdentifications(std::vector< IdentificationType > &ids)
Removes peptide or protein identifications that have no hits in them.
Definition IDFilter.h:846
static void removeEmptyIdentifications(PeptideIdentificationList &ids)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition IDFilter.h:659
IDFilter()=default
Constructor.
static void keepMatchingItemsUnroll(IDContainer &items, const Predicate &pred)
Keep Hit items that satisfy a condition in one of our ID containers (e.g. vector of Peptide or Protei...
Definition IDFilter.h:556
static void removeDanglingProteinReferences(ConsensusMap &cmap, bool remove_peptides_without_reference=false)
Removes dangling protein references from peptide hits in a ConsensusMap.
static void removeDecoys(IdentificationData &id_data)
Filter IdentificationData to remove parent sequences annotated as decoys.
static void keepHitsMatchingProteins(PeptideIdentificationList &ids, const std::set< String > &accessions)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition IDFilter.h:645
virtual ~IDFilter()=default
Destructor.
static void keepMatchingItems(Container &items, const Predicate &pred)
Keep items that satisfy a condition in a container (e.g. vector), removing all others.
Definition IDFilter.h:530
static void filterObservationMatchesByScore(IdentificationData &id_data, IdentificationData::ScoreTypeRef score_ref, double cutoff)
Filter observation matches (e.g. PSMs) in IdentificationData by score.
static void keepHitsMatchingProteins(AnnotatedMSRun &experiment, const std::vector< FASTAFile::FASTAEntry > &proteins)
Filters AnnotatedMSRun according to the given proteins.
Definition IDFilter.h:1407
static void removeMatchingPeptideHits(MapType &prot_and_pep_ids, Predicate &pred)
Definition IDFilter.h:575
static void filterHitsByRank(PeptideIdentificationList &ids, Size min_rank, Size max_rank)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition IDFilter.h:631
static bool updateProteinGroups(std::vector< ProteinIdentification::ProteinGroup > &groups, const std::vector< ProteinHit > &hits)
Update protein groups after protein hits were filtered.
static Size countHits(const PeptideIdentificationList &ids)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition IDFilter.h:620
static bool getBestHit(PeptideIdentificationList &ids, bool assume_sorted, PeptideHit &best_hit)
This is an overloaded member function, provided for convenience. It differs from the above function o...
Definition IDFilter.h:652
static void removeMatchingItemsUnroll(IDContainer &items, const Predicate &pred)
Remove Hit items that satisfy a condition in one of our ID containers (e.g. vector of Peptide or Prot...
Definition IDFilter.h:546
static void filterHitsByScore(PeptideIdentificationList &ids, double threshold_score)
Definition IDFilter.h:1476
static void removeMatchingPeptideIdentifications(MapType &prot_and_pep_ids, Predicate &pred)
Definition IDFilter.h:585
static void FilterPeptideEvidences(EvidenceFilter &filter, PeptideIdentificationList &peptides)
remove peptide evidences based on a filter
Definition IDFilter.h:745
static Size countHits(const std::vector< IdentificationType > &ids)
Returns the total number of peptide/protein hits in a vector of peptide/protein identifications.
Definition IDFilter.h:609
static void removeUnreferencedProteins(std::vector< ProteinIdentification > &proteins, PeptideIdentificationList &ids)
Definition IDFilter.h:1481
static void removeDanglingProteinReferences(PeptideIdentificationList &peptides, const std::vector< ProteinIdentification > &proteins, bool remove_peptides_without_reference=false)
Removes dangling protein references from peptide hits.
static bool getBestHit(const std::vector< IdentificationType > &identifications, bool assume_sorted, typename IdentificationType::HitType &best_hit)
Finds the best-scoring hit in a vector of peptide or protein identifications.
Definition IDFilter.h:679
static void extractPeptideSequences(const PeptideIdentificationList &peptides, std::set< String > &sequences, bool ignore_mods=false)
Extracts all unique peptide sequences from a list of peptide IDs.
static std::map< String, std::vector< ProteinHit > > extractUnassignedProteins(ConsensusMap &cmap)
Extracts all proteins not matched by PSMs in features.
static void removeUngroupedProteins(const std::vector< ProteinIdentification::ProteinGroup > &groups, std::vector< ProteinHit > &hits)
Update protein hits after protein groups were filtered.
static void removeMatchingPeptideIdentifications(PeptideIdentificationList &pep_ids, Predicate &pred)
Definition IDFilter.h:596
static void removeUnreferencedProteins(ConsensusMap &cmap, bool include_unassigned)
static void removeUnreferencedProteins(ProteinIdentification &proteins, const PeptideIdentificationList &peptides)
Removes protein hits from proteins that are not referenced by a peptide in peptides.
std::map< Int, PeptideHit * > ChargeToPepHitP
Typedefs.
Definition IDFilter.h:80
This class is used to switch identification scores within identification or consensus feature maps.
Definition IDScoreSwitcherAlgorithm.h:42
bool isScoreTypeHigherBetter(ScoreType score_type)
Determines whether a higher score type is better given a ScoreType enum.
Definition IDScoreSwitcherAlgorithm.h:139
bool isScoreType(const String &score_name, const ScoreType &type) const
Checks if the given score name corresponds to a specific score type.
Definition IDScoreSwitcherAlgorithm.h:75
ScoreSearchResult findScoreType(const IDType &id, ScoreType score_type) const
Searches for a general score type (e.g. PEP, QVAL) in an identification data structure.
Definition IDScoreSwitcherAlgorithm.h:176
Definition IdentificationData.h:87
In-Memory representation of a mass spectrometry run.
Definition MSExperiment.h:49
Representation of a peptide evidence.
Definition PeptideEvidence.h:28
Int getStart() const
get the position in the protein (starting at 0 for the N-terminus). If not available UNKNOWN_POSITION...
bool hasValidLimits() const
start and end numbers in evidence represent actual numeric indices
Int getEnd() const
get the position of the last AA of the peptide in protein coordinates (starting at 0 for the N-termin...
const String & getProteinAccession() const
get the protein accession the peptide matches to. If not available the empty string is returned.
Represents a single spectrum match (candidate) for a specific tandem mass spectrum (MS/MS).
Definition PeptideHit.h:52
const AASequence & getSequence() const
returns the peptide sequence
std::set< String > extractProteinAccessionsSet() const
extracts the set of non-empty protein accessions from peptide evidences
Container for peptide identifications from multiple spectra.
Definition PeptideIdentificationList.h:66
Class for the enzymatic digestion of proteins represented as AASequence or String.
Definition ProteaseDigestion.h:32
bool isValidProduct(const String &protein, int pep_pos, int pep_length, bool ignore_missed_cleavages=true, bool allow_nterm_protein_cleavage=false, bool allow_random_asp_pro_cleavage=false) const
Variant of EnzymaticDigestion::isValidProduct() with support for n-term protein cleavage and random D...
Representation of a protein hit.
Definition ProteinHit.h:35
const String & getAccession() const
returns the accession of the protein
Representation of a protein identification run.
Definition ProteinIdentification.h:54
A more convenient string class.
Definition String.h:34
Definition IDFilter.h:40
Concept to exclude std::vector of identification types (used to disambiguate template overloads)
Definition IDFilter.h:45
int Int
Signed integer type.
Definition Types.h:72
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition Types.h:97
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19
FASTA entry type (identifier, description and sequence) The first String corresponds to the identifie...
Definition FASTAFile.h:46
String identifier
Definition FASTAFile.h:47
Is peptide evidence digestion product of some protein.
Definition IDFilter.h:435
DigestionFilter(std::vector< FASTAFile::FASTAEntry > &entries, ProteaseDigestion &digestion, bool ignore_missed_cleavages, bool methionine_cleavage)
Definition IDFilter.h:444
GetMatchingItems< PeptideEvidence, FASTAFile::FASTAEntry > accession_resolver_
Definition IDFilter.h:439
void filterPeptideEvidences(PeptideIdentificationList &peptides)
Definition IDFilter.h:476
bool operator()(const PeptideEvidence &evidence) const
Definition IDFilter.h:449
bool ignore_missed_cleavages_
Definition IDFilter.h:441
PeptideEvidence argument_type
Definition IDFilter.h:436
ProteaseDigestion & digestion_
Definition IDFilter.h:440
bool methionine_cleavage_
Definition IDFilter.h:442
Builds a map index of data that have a String index to find matches and return the objects.
Definition IDFilter.h:309
std::map< String, Entry * > ItemMap
Definition IDFilter.h:311
GetMatchingItems()
Definition IDFilter.h:322
const String & getHitKey(const PeptideEvidence &p) const
Definition IDFilter.h:336
ItemMap items
Definition IDFilter.h:312
const String & getKey(const FASTAFile::FASTAEntry &entry) const
Definition IDFilter.h:326
HitType argument_type
Definition IDFilter.h:310
bool exists(const HitType &hit) const
Definition IDFilter.h:331
GetMatchingItems(std::vector< Entry > &records)
Definition IDFilter.h:314
const Entry & getValue(const PeptideEvidence &evidence) const
Definition IDFilter.h:341
Is this a decoy hit?
Definition IDFilter.h:223
bool operator()(const HitType &hit) const
Operator to check if a HitType object has decoy annotation.
Definition IDFilter.h:247
HitType argument_type
Definition IDFilter.h:224
HasDecoyAnnotation()
Default constructor.
Definition IDFilter.h:233
Is the score of this hit at least as good as the given value?
Definition IDFilter.h:93
bool operator()(const HitType &hit) const
Definition IDFilter.h:103
double score
Definition IDFilter.h:96
HitType argument_type
Definition IDFilter.h:94
HasGoodScore(double score_, bool higher_score_better_)
Definition IDFilter.h:99
bool higher_score_better
Definition IDFilter.h:97
Given a list of protein accessions, do any occur in the annotation(s) of this hit?
Definition IDFilter.h:265
HasMatchingAccessionImpl(const SetType &accessions_)
Definition IDFilter.h:270
const SetType & accessions
Definition IDFilter.h:268
HitType argument_type
Definition IDFilter.h:266
bool operator()(const PeptideHit &hit) const
Definition IDFilter.h:274
bool operator()(const PeptideEvidence &evidence) const
Definition IDFilter.h:289
bool operator()(const ProteinHit &hit) const
Definition IDFilter.h:284
Does a meta value of this hit have at most the given value?
Definition IDFilter.h:142
bool operator()(const HitType &hit) const
Definition IDFilter.h:152
HasMaxMetaValue(const String &key_, const double &value_)
Definition IDFilter.h:148
HitType argument_type
Definition IDFilter.h:143
String key
Definition IDFilter.h:145
double value
Definition IDFilter.h:146
Is a meta value with given key and value set on this hit?
Definition IDFilter.h:119
bool operator()(const HitType &hit) const
Definition IDFilter.h:129
DataValue value
Definition IDFilter.h:123
HitType argument_type
Definition IDFilter.h:120
HasMetaValue(const String &key_, const DataValue &value_)
Definition IDFilter.h:125
String key
Definition IDFilter.h:122
Predicate to check if a HitType object has a minimum meta value.
Definition IDFilter.h:170
bool operator()(const HitType &hit) const
Operator() function to check if a HitType object has a minimum meta value.
Definition IDFilter.h:194
HitType argument_type
Definition IDFilter.h:171
String key
Definition IDFilter.h:173
HasMinMetaValue(const String &key_, const double &value_)
Constructor for HasMinMetaValue.
Definition IDFilter.h:182
double value
Definition IDFilter.h:174
Is the list of hits of this peptide/protein ID empty?
Definition IDFilter.h:490
bool operator()(const IdentificationType &id) const
Definition IDFilter.h:493
IdentificationType argument_type
Definition IDFilter.h:491
Wrapper that adds operator< to iterators, so they can be used as (part of) keys in maps/sets or multi...
Definition MetaData.h:20