51 #include <unordered_set>
96 template <
typename ContainerType,
typename PredicateType>
99 for (
auto it = container.begin(); it != container.end(); )
103 it = container.erase(it);
224 bool allow_missing =
false;
234 current_step_ref_(processing_steps_.end()), no_checks_(false)
376 return processing_softwares_;
382 return processing_steps_;
388 return db_search_params_;
394 return db_search_steps_;
406 return observations_;
418 return parent_groups_;
424 return identified_peptides_;
430 return identified_compounds_;
436 return identified_oligos_;
448 return observation_matches_;
454 return observation_match_groups_;
487 bool require_score =
false)
const;
500 template <
typename PredicateType>
503 auto count = observation_matches_.size();
505 if (count != observation_matches_.size()) cleanup();
515 template <
typename PredicateType>
518 auto count = parents_.size();
520 if (count != parents_.size()) cleanup();
523 template <
typename PredicateType>
526 for (
auto it = observations_.begin(); it != observations_.end(); ++it)
527 observations_.modify(it, func);
551 void cleanup(
bool require_observation_match =
true,
552 bool require_identified_sequence =
true,
553 bool require_parent_match =
true,
554 bool require_parent_group =
false,
555 bool require_match_group =
false);
593 template <
class ScoredProcessingResults>
595 bool all_elements =
false,
bool any_score =
false)
const
597 std::map<ScoreTypeRef, Size> score_counts;
601 for (
const auto& element : container)
603 for (
const auto& step : element.steps_and_scores)
605 for (
const auto& pair : step.scores)
607 score_counts[pair.first]++;
614 for (
const auto& element : container)
616 auto score_info = element.getMostRecentScore();
617 if (std::get<2>(score_info))
620 if (!all_elements)
return score_ref;
621 score_counts[score_ref]++;
625 if (score_counts.empty())
return score_types_.end();
626 auto pos = max_element(score_counts.begin(), score_counts.end());
691 steps_and_scores)
const;
713 template <
typename ElementType>
721 template <
typename ElementType>
729 template <
typename ElementType>
733 template <
typename ContainerType,
typename ElementType>
737 template <
typename ContainerType,
typename ElementType>
739 ContainerType& container,
const ElementType& element,
Definition: AdductInfo.h:43
Class to hold strings, numeric values, lists of strings and lists of numeric values.
Definition: DataValue.h:59
Definition: IdentificationData.h:113
ObservationRef registerObservation(const Observation &obs)
Register an observation (e.g. MS2 spectrum or feature)
IdentificationDataInternal::PeakAnnotations PeakAnnotations
Definition: IdentificationData.h:182
DBSearchParams db_search_params_
Definition: IdentificationData.h:652
ParentGroupSets parent_groups_
Definition: IdentificationData.h:659
IdentificationDataInternal::ParentMatches ParentMatches
Definition: IdentificationData.h:164
void calculateCoverages(bool check_molecule_length=false)
Calculate sequence coverages of parent sequences.
ProcessingSoftwares processing_softwares_
Definition: IdentificationData.h:650
IdentificationData(const IdentificationData &other)
Copy constructor.
std::unordered_set< uintptr_t > AddressLookup
Definition: IdentificationData.h:207
ProcessingSteps processing_steps_
Definition: IdentificationData.h:651
const DBSearchParams & getDBSearchParams() const
Return the registered database search parameters (immutable)
Definition: IdentificationData.h:386
IdentificationData(IdentificationData &&other) noexcept
Move constructor.
ObservationMatchGroups observation_match_groups_
Definition: IdentificationData.h:665
ObservationMatches observation_matches_
Definition: IdentificationData.h:664
void removeObservationMatchesIf(PredicateType &&func)
Helper function for filtering observation matches (e.g. PSMs) in IdentificationData.
Definition: IdentificationData.h:501
ScoreTypeRef findScoreType(const String &score_name) const
Look up a score type by name.
IdentificationDataInternal::ScoreTypes ScoreTypes
Definition: IdentificationData.h:144
const ProcessingSoftwares & getProcessingSoftwares() const
Return the registered data processing software (immutable)
Definition: IdentificationData.h:374
AdductRef registerAdduct(const AdductInfo &adduct)
Register an adduct.
AddressLookup observation_match_lookup_
Definition: IdentificationData.h:684
IdentificationDataInternal::IdentifiedOligos IdentifiedOligos
Definition: IdentificationData.h:177
const InputFiles & getInputFiles() const
Return the registered input files (immutable)
Definition: IdentificationData.h:368
MatchGroupRef registerObservationMatchGroup(const ObservationMatchGroup &group)
Register a group of observation matches that belong together.
AddressLookup observation_lookup_
Definition: IdentificationData.h:678
void removeMetaValue(const ObservationMatchRef ref, const String &key)
ProcessingStepRef registerProcessingStep(const ProcessingStep &step, SearchParamRef search_ref)
Register a database search step with associated parameters.
AddressLookup identified_oligo_lookup_
Definition: IdentificationData.h:683
IdentifiedOligos identified_oligos_
Definition: IdentificationData.h:662
const ObservationMatchGroups & getObservationMatchGroups() const
Return the registered groups of observation matches (immutable)
Definition: IdentificationData.h:452
const ParentSequences & getParentSequences() const
Return the registered parent sequences (immutable)
Definition: IdentificationData.h:410
bool no_checks_
Suppress validity checks in register... calls?
Definition: IdentificationData.h:675
void setMetaValue(const ObservationRef ref, const String &key, const DataValue &value)
Set a meta value on a stored observation.
const IdentifiedCompounds & getIdentifiedCompounds() const
Return the registered compounds (immutable)
Definition: IdentificationData.h:428
void addScore(ObservationMatchRef match_ref, ScoreTypeRef score_ref, double value)
Add a score to an input match (e.g. PSM)
IdentifiedCompoundRef registerIdentifiedCompound(const IdentifiedCompound &compound)
Register an identified compound (small molecule)
ObservationMatchRef registerObservationMatch(const ObservationMatch &match)
Register an observation match (e.g. peptide-spectrum match)
IdentificationDataInternal::Adducts Adducts
Definition: IdentificationData.h:184
IdentifiedOligoRef registerIdentifiedOligo(const IdentifiedOligo &oligo)
Register an identified RNA oligonucleotide.
bool empty() const
Return whether the data structure is empty (no data)
Adducts adducts_
Definition: IdentificationData.h:663
void setCurrentProcessingStep(ProcessingStepRef step_ref)
Set a data processing step that will apply to all subsequent "register..." calls.
IdentificationDataInternal::Observations Observations
Definition: IdentificationData.h:156
void swap(IdentificationData &other)
Swap contents with a second instance.
void setMetaValue(const ObservationMatchRef ref, const String &key, const DataValue &value)
Set a meta value on a stored observation match (e.g. PSM)
IdentificationData & operator=(IdentificationData &&other) noexcept
Move assignment operator.
IdentificationDataInternal::ParentSequences ParentSequences
Definition: IdentificationData.h:160
ScoreTypeRef registerScoreType(const ScoreType &score)
Register a score type.
IdentificationDataInternal::AppliedProcessingSteps AppliedProcessingSteps
Definition: IdentificationData.h:153
const ProcessingSteps & getProcessingSteps() const
Return the registered data processing steps (immutable)
Definition: IdentificationData.h:380
void applyToObservations(PredicateType &&func)
Definition: IdentificationData.h:524
const ParentGroupSets & getParentGroupSets() const
Return the registered parent sequence groupings (immutable)
Definition: IdentificationData.h:416
IdentificationDataInternal::InputFiles InputFiles
Definition: IdentificationData.h:124
std::pair< ObservationMatchRef, ObservationMatchRef > getMatchesForObservation(ObservationRef obs_ref) const
Get range of matches (cf. equal_range) for a given observation.
ProcessingStepRef registerProcessingStep(const ProcessingStep &step)
Register a data processing step.
IdentificationDataInternal::DBSearchParams DBSearchParams
Definition: IdentificationData.h:139
const ScoreTypes & getScoreTypes() const
Return the registered score types (immutable)
Definition: IdentificationData.h:398
IdentificationData()
Default constructor.
Definition: IdentificationData.h:233
IdentifiedCompounds identified_compounds_
Definition: IdentificationData.h:661
const IdentifiedOligos & getIdentifiedOligos() const
Return the registered identified oligonucleotides (immutable)
Definition: IdentificationData.h:434
IdentificationDataInternal::IdentifiedPeptides IdentifiedPeptides
Definition: IdentificationData.h:167
DBSearchSteps db_search_steps_
Definition: IdentificationData.h:655
ProcessingStepRef getCurrentProcessingStep()
Return the current processing step (set via setCurrentProcessingStep()).
ProcessingSoftwareRef registerProcessingSoftware(const ProcessingSoftware &software)
Register data processing software.
void checkParentMatches_(const ParentMatches &matches, MoleculeType expected_type) const
Helper function to check if all parent matches are valid.
Observations observations_
Definition: IdentificationData.h:657
IdentificationDataInternal::ProcessingSteps ProcessingSteps
Definition: IdentificationData.h:135
IdentificationDataInternal::DBSearchSteps DBSearchSteps
Definition: IdentificationData.h:141
void setMetaValue(const IdentifiedMolecule &var, const String &key, const DataValue &value)
Set a meta value on a stored identified molecule (variant)
ParentSequenceRef registerParentSequence(const ParentSequence &parent)
Register a parent sequence (e.g. protein or intact RNA)
const DBSearchSteps & getDBSearchSteps() const
Return the registered database search steps (immutable)
Definition: IdentificationData.h:392
ScoreTypes score_types_
Definition: IdentificationData.h:656
InputFiles input_files_
Definition: IdentificationData.h:649
IdentificationDataInternal::AdductOpt AdductOpt
Definition: IdentificationData.h:186
const Adducts & getAdducts() const
Return the registered adducts (immutable)
Definition: IdentificationData.h:440
IdentificationDataInternal::ParentGroupSets ParentGroupSets
Definition: IdentificationData.h:205
void mergeScoredProcessingResults_(ScoredProcessingResult &result, const ScoredProcessingResult &other, const RefTranslator &trans)
Helper function to merge scored processing results while updating references (to processing steps and...
ContainerType::iterator insertIntoMultiIndex_(ContainerType &container, const ElementType &element)
Helper function for adding entries (derived from ScoredProcessingResult) to a boost::multi_index_cont...
InputFileRef registerInputFile(const InputFile &file)
Register an input file.
IdentifiedPeptideRef registerIdentifiedPeptide(const IdentifiedPeptide &peptide)
Register an identified peptide.
AddressLookup identified_peptide_lookup_
Definition: IdentificationData.h:681
ContainerType::iterator insertIntoMultiIndex_(ContainerType &container, const ElementType &element, AddressLookup &lookup)
Variant of insertIntoMultiIndex_() that also updates a look-up table of valid references (addresses)
ProcessingStepRef current_step_ref_
Reference to the current data processing step (see setCurrentProcessingStep())
Definition: IdentificationData.h:668
void clear()
Clear all contents.
const IdentifiedPeptides & getIdentifiedPeptides() const
Return the registered identified peptides (immutable)
Definition: IdentificationData.h:422
void clearCurrentProcessingStep()
Cancel the effect of setCurrentProcessingStep().
std::vector< ObservationMatchRef > getBestMatchPerObservation(ScoreTypeRef score_ref, bool require_score=false) const
Return the best match for each observation, according to a given score type.
void cleanup(bool require_observation_match=true, bool require_identified_sequence=true, bool require_parent_match=true, bool require_parent_group=false, bool require_match_group=false)
Clean up the data structure after filtering parts of it.
IdentificationDataInternal::ProcessingSoftwares ProcessingSoftwares
Definition: IdentificationData.h:130
void removeParentSequencesIf(PredicateType &&func)
Helper function for filtering parent sequences (e.g. protein sequences) in IdentificationData.
Definition: IdentificationData.h:516
SearchParamRef registerDBSearchParam(const DBSearchParam &param)
Register database search parameters.
void checkScoreTypes_(const std::map< ScoreTypeRef, double > &scores) const
Helper function to check if all score types are valid.
const Observations & getObservations() const
Return the registered observations (immutable)
Definition: IdentificationData.h:404
AddressLookup parent_lookup_
Definition: IdentificationData.h:679
void checkAppliedProcessingSteps_(const AppliedProcessingSteps &steps_and_scores) const
Helper function to check if all applied processing steps are valid.
IdentificationDataInternal::ParentGroups ParentGroups
Definition: IdentificationData.h:200
AddressLookup identified_compound_lookup_
Definition: IdentificationData.h:682
RefTranslator merge(const IdentificationData &other)
Merge in data from another instance.
IdentificationDataInternal::ObservationMatchGroups ObservationMatchGroups
Definition: IdentificationData.h:195
IdentificationData & operator=(const IdentificationData &other)
Copy assignment operator.
const ObservationMatches & getObservationMatches() const
Return the registered observation matches (immutable)
Definition: IdentificationData.h:446
IdentificationDataInternal::IdentifiedCompounds IdentifiedCompounds
Definition: IdentificationData.h:172
IdentifiedPeptides identified_peptides_
Definition: IdentificationData.h:660
void registerParentGroupSet(const ParentGroupSet &groups)
Register a grouping of parent sequences (e.g. protein inference result)
ParentSequences parents_
Definition: IdentificationData.h:658
IdentificationDataInternal::ObservationMatches ObservationMatches
Definition: IdentificationData.h:189
ScoreTypeRef pickScoreType(const ScoredProcessingResults &container, bool all_elements=false, bool any_score=false) const
Definition: IdentificationData.h:594
Helper functor for adding processing steps to elements in a boost::multi_index_container structure.
Definition: IdentificationData.h:714
Helper functor for adding scores to elements in a boost::multi_index_container structure.
Definition: IdentificationData.h:722
Helper functor for removing invalid parent matches from elements in a boost::multi_index_container st...
Definition: IdentificationData.h:730
A more convenient string class.
Definition: String.h:60
std::map< ProcessingStepRef, SearchParamRef > DBSearchSteps
Definition: DBSearchParam.h:126
IteratorWrapper< ObservationMatchGroups::iterator > MatchGroupRef
Definition: ObservationMatchGroup.h:100
IteratorWrapper< IdentifiedCompounds::iterator > IdentifiedCompoundRef
Definition: IdentifiedCompound.h:81
IdentifiedSequence< NASequence > IdentifiedOligo
Definition: IdentifiedSequence.h:107
IteratorWrapper< IdentifiedOligos::iterator > IdentifiedOligoRef
Definition: IdentifiedSequence.h:125
boost::multi_index_container< Observation, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::composite_key< Observation, boost::multi_index::member< Observation, InputFileRef, &Observation::input_file >, boost::multi_index::member< Observation, String, &Observation::data_id > > > > > Observations
Definition: Observation.h:95
boost::multi_index_container< ObservationMatch, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::composite_key< ObservationMatch, boost::multi_index::member< ObservationMatch, ObservationRef, &ObservationMatch::observation_ref >, boost::multi_index::member< ObservationMatch, IdentifiedMolecule, &ObservationMatch::identified_molecule_var >, boost::multi_index::member< ObservationMatch, AdductOpt, &ObservationMatch::adduct_opt > > > > > ObservationMatches
Definition: ObservationMatch.h:150
std::optional< AdductRef > AdductOpt
Definition: ObservationMatch.h:70
std::set< ScoreType > ScoreTypes
Definition: ScoreType.h:91
IteratorWrapper< IdentifiedPeptides::iterator > IdentifiedPeptideRef
Definition: IdentifiedSequence.h:116
IteratorWrapper< ScoreTypes::iterator > ScoreTypeRef
Definition: ScoreType.h:92
IteratorWrapper< Adducts::iterator > AdductRef
Definition: ObservationMatch.h:69
std::set< DBSearchParam > DBSearchParams
Definition: DBSearchParam.h:124
IteratorWrapper< Observations::iterator > ObservationRef
Definition: Observation.h:96
boost::multi_index_container< AppliedProcessingStep, boost::multi_index::indexed_by< boost::multi_index::sequenced<>, boost::multi_index::ordered_unique< boost::multi_index::member< AppliedProcessingStep, std::optional< ProcessingStepRef >, &AppliedProcessingStep::processing_step_opt > > > > AppliedProcessingSteps
Definition: AppliedProcessingStep.h:133
IteratorWrapper< ObservationMatches::iterator > ObservationMatchRef
Definition: ObservationMatch.h:152
boost::multi_index_container< IdentifiedPeptide, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::member< IdentifiedPeptide, AASequence, &IdentifiedPeptide::sequence > > > > IdentifiedPeptides
Definition: IdentifiedSequence.h:115
IteratorWrapper< ProcessingSoftwares::iterator > ProcessingSoftwareRef
Definition: ProcessingSoftware.h:68
IteratorWrapper< DBSearchParams::iterator > SearchParamRef
Definition: DBSearchParam.h:125
std::vector< PeptideHit::PeakAnnotation > PeakAnnotations
Definition: ObservationMatch.h:52
MoleculeType
Definition: MetaData.h:66
boost::multi_index_container< ParentSequence, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::member< ParentSequence, String, &ParentSequence::accession > > > > ParentSequences
Definition: ParentSequence.h:120
std::vector< ParentGroupSet > ParentGroupSets
Definition: ParentGroup.h:82
boost::multi_index_container< ParentGroup, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::member< ParentGroup, std::set< ParentSequenceRef >, &ParentGroup::parent_refs > > > > ParentGroups
Definition: ParentGroup.h:64
boost::multi_index_container< IdentifiedOligo, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::member< IdentifiedOligo, NASequence, &IdentifiedOligo::sequence > > > > IdentifiedOligos
Definition: IdentifiedSequence.h:124
boost::multi_index_container< IdentifiedCompound, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::member< IdentifiedCompound, String, &IdentifiedCompound::identifier > > > > IdentifiedCompounds
Definition: IdentifiedCompound.h:80
std::map< ParentSequenceRef, std::set< ParentMatch > > ParentMatches
mapping: parent sequence -> match information
Definition: ParentMatch.h:101
std::set< ProcessingStep > ProcessingSteps
Definition: ProcessingStep.h:88
std::set< ProcessingSoftware > ProcessingSoftwares
Definition: ProcessingSoftware.h:67
IteratorWrapper< ProcessingSteps::iterator > ProcessingStepRef
Definition: ProcessingStep.h:89
boost::multi_index_container< ObservationMatchGroup, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::member< ObservationMatchGroup, std::set< ObservationMatchRef >, &ObservationMatchGroup::observation_match_refs > > > > ObservationMatchGroups
Definition: ObservationMatchGroup.h:99
IdentifiedSequence< AASequence > IdentifiedPeptide
Definition: IdentifiedSequence.h:106
IteratorWrapper< InputFiles::iterator > InputFileRef
Definition: include/OpenMS/METADATA/ID/InputFile.h:95
MassType
Definition: MetaData.h:74
IteratorWrapper< ParentSequences::iterator > ParentSequenceRef
Definition: ParentSequence.h:121
IteratorWrapper< ParentGroups::iterator > ParentGroupRef
Definition: ParentGroup.h:65
boost::multi_index_container< InputFile, boost::multi_index::indexed_by< boost::multi_index::ordered_unique< boost::multi_index::member< InputFile, String, &InputFile::name > > > > InputFiles
Definition: include/OpenMS/METADATA/ID/InputFile.h:94
std::set< AdductInfo, AdductCompare > Adducts
Definition: ObservationMatch.h:68
Group of ambiguously identified parent sequences (e.g. protein group)
Definition: ParentGroup.h:51
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:48
Definition: AppliedProcessingStep.h:56
Parameters specific to a database search step.
Definition: DBSearchParam.h:48
Definition: IdentifiedCompound.h:49
Variant type holding Peptide/Compound/Oligo references and convenience functions.
Definition: IdentifiedMolecule.h:55
Representation of an identified sequence (peptide or oligonucleotide)
Definition: IdentifiedSequence.h:53
Group of related (co-identified) input matches
Definition: ObservationMatchGroup.h:51
Representation of a search hit (e.g. peptide-spectrum match).
Definition: ObservationMatch.h:74
Representation of an observation, e.g. a spectrum or feature, in an input data file.
Definition: Observation.h:54
Set of groups of ambiguously identified parent sequences (e.g. results of running a protein inference...
Definition: ParentGroup.h:70
Meta data for the association between an identified molecule (e.g. peptide) and a parent sequence (e....
Definition: ParentMatch.h:46
Representation of a parent sequence that is identified only indirectly (e.g. a protein).
Definition: ParentSequence.h:50
Information about software used for data processing.
Definition: ProcessingSoftware.h:49
Data processing step that is applied to the data (e.g. database search, PEP calculation,...
Definition: ProcessingStep.h:48
Information about a score type.
Definition: ScoreType.h:46
Base class for ID data with scores and processing steps (and meta info)
Definition: ScoredProcessingResult.h:45
Structure that maps references of corresponding objects after copying
Definition: IdentificationData.h:210
std::map< ObservationMatchRef, ObservationMatchRef > observation_match_refs
Definition: IdentificationData.h:222
std::map< ProcessingSoftwareRef, ProcessingSoftwareRef > processing_software_refs
Definition: IdentificationData.h:213
std::map< IdentifiedPeptideRef, IdentifiedPeptideRef > identified_peptide_refs
Definition: IdentificationData.h:218
IdentifiedMolecule translate(IdentifiedMolecule old) const
std::map< ParentSequenceRef, ParentSequenceRef > parent_sequence_refs
Definition: IdentificationData.h:217
ObservationMatchRef translate(ObservationMatchRef old) const
std::map< SearchParamRef, SearchParamRef > search_param_refs
Definition: IdentificationData.h:214
std::map< ScoreTypeRef, ScoreTypeRef > score_type_refs
Definition: IdentificationData.h:212
std::map< IdentifiedCompoundRef, IdentifiedCompoundRef > identified_compound_refs
Definition: IdentificationData.h:220
std::map< ProcessingStepRef, ProcessingStepRef > processing_step_refs
Definition: IdentificationData.h:215
std::map< AdductRef, AdductRef > adduct_refs
Definition: IdentificationData.h:221
std::map< ObservationRef, ObservationRef > observation_refs
Definition: IdentificationData.h:216
std::map< IdentifiedOligoRef, IdentifiedOligoRef > identified_oligo_refs
Definition: IdentificationData.h:219
std::map< InputFileRef, InputFileRef > input_file_refs
Definition: IdentificationData.h:211