|
OpenMS
2.6.0
|
Go to the documentation of this file.
87 enum type {primary, secondary, primary_indistinguishable, secondary_indistinguishable} protein_type;
91 std::list<ProteinEntry *>
indis;
144 enum type {PeptideIdent, Consensus} input_type;
165 void resolveID(std::vector<PeptideIdentification> & peptide_identifications);
219 void countTargetDecoy(std::vector<MSDGroup> & msd_groups,
ConsensusMap & consensus);
227 void countTargetDecoy(std::vector<MSDGroup> & msd_groups, std::vector<PeptideIdentification> & peptide_nodes);
231 void setProteinData(std::vector<FASTAFile::FASTAEntry> & protein_data);
233 const std::vector<ResolverResult> & getResults();
239 static const PeptideHit & getPeptideHit(
const std::vector<PeptideIdentification> & peptide_nodes,
const PeptideEntry * peptide);
246 void computeIntensityOfMSD_(std::vector<MSDGroup> & msd_groups);
252 Size findPeptideEntry_(
String seq, std::vector<PeptideEntry> & nodes);
254 Size binarySearchNodes_(
String & seq, std::vector<PeptideEntry> & nodes,
Size start,
Size end);
256 Size includeMSMSPeptides_(std::vector<PeptideIdentification> & peptide_identifications, std::vector<PeptideEntry> & peptide_nodes);
259 Size includeMSMSPeptides_(
ConsensusMap & consensus, std::vector<PeptideEntry> & peptide_nodes);
261 void reindexingNodes_(std::vector<MSDGroup> & msd_groups, std::vector<Size> & reindexed_proteins, std::vector<Size> & reindexed_peptides);
263 void primaryProteins_(std::vector<PeptideEntry> & peptide_nodes, std::vector<Size> & reindexed_peptides);
264 void buildingMSDGroups_(std::vector<MSDGroup> & msd_groups, std::vector<ISDGroup> & isd_groups);
265 void buildingISDGroups_(std::vector<ProteinEntry> & protein_nodes, std::vector<PeptideEntry> & peptide_nodes,
266 std::vector<ISDGroup> & isd_groups);
OpenMS identification format (.idXML)
Definition: FileTypes.h:66
Int getCharge() const
returns the charge of the peptide
Base class for TOPP applications.
Definition: TOPPBase.h:144
Representation of an experimental design in OpenMS. Instances can be loaded with the ExperimentalDesi...
Definition: ExperimentalDesign.h:243
static ExperimentalDesign load(const String &tsv_file, bool require_spectra_files)
Loads an experimental design from a tabular separated file.
File adapter for MzTab files.
Definition: MzTabFile.h:58
Resolves shared peptides based on protein scores.
Definition: PeptideProteinResolution.h:86
Statistics for processing summary.
Definition: PeptideAndProteinQuant.h:117
represents a protein from FASTA file
Definition: ProteinResolver.h:82
QuotingMethod
How to handle embedded quotes when quoting strings.
Definition: String.h:82
std::list< ProteinEntry * > indis
Definition: ProteinResolver.h:91
Definition: ProteinResolver.h:135
std::list< PeptideEntry * > peptides
Definition: ProteinResolver.h:84
const std::vector< ProteinGroup > & getIndistinguishableProteins() const
Returns the indistinguishable proteins.
String identifier
Definition: ProteinResolver.h:137
void setProteinData(std::vector< FASTAFile::FASTAEntry > &protein_data)
std::vector< PeptideEntry > * peptide_entries
Definition: ProteinResolver.h:141
Size peptide_hit
Definition: ProteinResolver.h:105
const AASequence & getSequence() const
returns the peptide sequence without trailing or following spaces
bool modifyStrings(bool modify)
Switch modification of strings (quoting/replacing of separators) on/off.
String identifier
Definition: FASTAFile.h:78
bool traversed
Definition: ProteinResolver.h:102
std::vector< MSDGroup > * msds
Definition: ProteinResolver.h:139
String & substitute(char from, char to)
Replaces all occurrences of the character from by the character to.
This class serves for reading in and writing FASTA files.
Definition: FASTAFile.h:64
double weight
Definition: ProteinResolver.h:88
std::vector< ResolverResult > resolver_result_
Definition: ProteinResolver.h:243
enum OpenMS::ProteinResolver::ResolverResult::type input_type
A more convenient string class.
Definition: String.h:59
representation of an msd group. Contains peptides, proteins and a pointer to its ISD group
Definition: ProteinResolver.h:115
float intensity
Definition: ProteinResolver.h:110
static const PeptideIdentification & getPeptideIdentification(const ConsensusMap &consensus, const PeptideEntry *peptide)
overloaded functions – return a const reference to a PeptideIdentification object or a peptideHit eit...
void applyDesign2Resolver(ProteinResolver &resolver, TextFile &file, StringList &fileNames)
xxxxxxx
Size number_of_target
Definition: ProteinResolver.h:122
This class provides some basic file handling methods for text files.
Definition: TextFile.h:46
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
double getMonoWeight(Residue::ResidueType type=Residue::Full, Int charge=0) const
unsigned getNumberOfSamples() const
FASTAFile::FASTAEntry * fasta_entry
Definition: ProteinResolver.h:86
std::vector< ProteinHit >::iterator findHit(const String &accession)
Finds a protein hit by accession (returns past-the-end iterator if not found)
Data model of MzTab files. Please see the official MzTab specification at https://code....
Definition: MzTab.h:800
const DataValue & getValue(const String &key) const
Returns a value of a parameter.
String toString() const
returns the peptide as string with modifications embedded in brackets
Size number_of_experimental_peptides
Definition: ProteinResolver.h:95
Size n_samples
number of samples (or assays in mzTab terms)
Definition: PeptideAndProteinQuant.h:120
String toUnmodifiedString() const
returns the peptide as string without any modifications or (e.g., "PEPTIDER")
const PeptideQuant & getPeptideResults()
Get peptide abundance data.
Representation of a protein identification run.
Definition: ProteinIdentification.h:70
FASTA entry type (identifier, description and sequence)
Definition: FASTAFile.h:76
const Statistics & getStatistics()
Get summary statistics.
ISDGroup * isd_group
Definition: ProteinResolver.h:120
void quantifyPeptides(const std::vector< PeptideIdentification > &peptides=std::vector< PeptideIdentification >())
Compute peptide abundances.
bool traversed
Definition: ProteinResolver.h:85
A base class for all classes handling default parameters.
Definition: DefaultParamHandler.h:92
const std::vector< PeptideHit > & getHits() const
returns the peptide hits as const
static ExperimentalDesign fromConsensusMap(const ConsensusMap &c)
Extract experimental design from consensus map.
void load(const String &filename, std::vector< ProteinIdentification > &protein_ids, std::vector< PeptideIdentification > &peptide_ids)
Loads the identifications of an idXML file without identifier.
Exception indicating that an invalid parameter was handed over to an algorithm.
Definition: Exception.h:347
static String concatenate(const std::vector< T > &container, const String &glue="")
Concatenates all elements of the container and puts the glue string between elements.
Definition: ListUtils.h:193
static MzTab exportConsensusMapToMzTab(const ConsensusMap &consensus_map, const String &filename, const bool first_run_inference_only, const bool export_unidentified_features, const bool export_unassigned_ids, const bool export_subfeatures, const bool export_empty_pep_ids=false, const String &title="ConsensusMap export from OpenMS")
export linked peptide features aka consensus map
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:46
represents a peptide. First in silico. If experimental is set to true it is MS/MS derived.
Definition: ProteinResolver.h:99
Size msd_group
Definition: ProteinResolver.h:93
OpenMS feature file (.featureXML)
Definition: FileTypes.h:65
std::map< UInt64, double > SampleAbundances
Mapping: sample ID -> abundance.
Definition: PeptideAndProteinQuant.h:59
Size number_of_decoy
Definition: ProteinResolver.h:121
void readQuantData(FeatureMap &features, const ExperimentalDesign &ed)
Read quantitative data from a feature map.
Stream class for writing to comma/tab/...-separated values files.
Definition: SVOutStream.h:54
bool experimental
Definition: ProteinResolver.h:109
const std::vector< ResolverResult > & getResults()
const std::vector< ProteinIdentification > & getProteinIdentifications() const
non-mutable access to the protein identifications
const std::vector< ProteinHit > & getHits() const
Returns the protein hits.
std::vector< ISDGroup > * isds
Definition: ProteinResolver.h:138
std::vector< FASTAFile::FASTAEntry > protein_data_
Definition: ProteinResolver.h:244
void load(const String &filename, FeatureMap &feature_map)
loads the file with name filename into map and calls updateRanges().
Definition: ProteinResolver.h:144
Type
Actual file types enum.
Definition: FileTypes.h:58
Merge files according to experimental design.
Definition: QuantitativeExperimentalDesign.h:56
Size index
Definition: ProteinResolver.h:92
std::vector< Size > * reindexed_peptides
Definition: ProteinResolver.h:142
void store(const String &filename, const MzTab &mz_tab) const
static FileTypes::Type getType(const String &filename)
Tries to determine the file type (by name or content)
void setParameters(const Param ¶m)
Sets the parameters.
QString toQString() const
Conversion to Qt QString.
const Param & getParameters() const
Non-mutable access to the parameters.
Log Stream Class.
Definition: LogStream.h:311
A container for consensus elements.
Definition: ConsensusMap.h:80
std::vector< String > StringList
Vector of String.
Definition: ListUtils.h:70
void load(const String &filename, ConsensusMap &map)
Loads a consensus map from file and calls updateRanges.
std::list< Size > msd_groups
Definition: ProteinResolver.h:132
String sequence
Definition: ProteinResolver.h:103
int main(int argc, const char **argv)
Definition: INIFileEditor.cpp:73
void buildGraph(ProteinIdentification &protein, const std::vector< PeptideIdentification > &peptides, bool skip_sort=false)
Size index
Definition: ProteinResolver.h:119
type
Definition: ProteinResolver.h:144
std::list< ProteinEntry * > proteins
Definition: ProteinResolver.h:117
const ColumnHeaders & getColumnHeaders() const
Non-mutable access to the file descriptions.
Size isd_group
Definition: ProteinResolver.h:94
Size msd_group
Definition: ProteinResolver.h:107
bool update(const Param &p_outdated, const bool add_unknown=false)
Rescue parameter values from p_outdated to current param.
A required parameter was not given.
Definition: TOPPBase.h:111
const ProteinQuant & getProteinResults()
Get protein abundance data.
A container for features.
Definition: FeatureMap.h:97
Represents the peptide hits for a spectrum.
Definition: PeptideIdentification.h:62
double getMZ() const
returns the MZ of the MS2 spectrum
static void load(const String &filename, std::vector< FASTAEntry > &data)
loads a FASTA file given by 'filename' and stores the information in 'data'
std::vector< PeptideIdentification > * peptide_identification
Definition: ProteinResolver.h:145
double getScore() const
returns the PSM score
String origin
Definition: ProteinResolver.h:111
std::list< PeptideEntry * > peptides
Definition: ProteinResolver.h:118
static ExperimentalDesign fromFeatureMap(const FeatureMap &f)
Extract experimental design from feature map.
ConsensusMap * consensus_map
Definition: ProteinResolver.h:146
This class provides Input/Output functionality for feature maps.
Definition: FeatureXMLFile.h:68
void resolveConsensus(ConsensusMap &consensus)
Computing protein groups from peptide identifications OR consensus map.
std::vector< ProteinEntry > * protein_entries
Definition: ProteinResolver.h:140
Management and storage of parameters / INI files.
Definition: Param.h:73
Representation of a peptide/protein sequence.
Definition: AASequence.h:111
static ExperimentalDesign fromIdentifications(const std::vector< ProteinIdentification > &proteins)
Extract experimental design from identifications.
Definition: ProteinResolver.h:127
Size peptide_identification
Definition: ProteinResolver.h:104
static const PeptideHit & getPeptideHit(const ConsensusMap &consensus, const PeptideEntry *peptide)
#define OPENMS_LOG_INFO
Macro if a information, e.g. a status should be reported.
Definition: LogStream.h:465
float coverage
Definition: ProteinResolver.h:89
std::map< String, ProteinData > ProteinQuant
Mapping: protein accession -> protein data.
Definition: PeptideAndProteinQuant.h:114
std::vector< Size > * reindexed_proteins
Definition: ProteinResolver.h:143
Helper class for peptide and protein quantification based on feature data annotated with IDs.
Definition: ProteinResolver.h:56
void load(const String &filename, bool trim_lines=false, Int first_n=-1, bool skip_empty_lines=false)
Loads data from a text file.
type
Definition: ProteinResolver.h:87
Size isd_group
Definition: ProteinResolver.h:108
const std::vector< ProteinIdentification > & getProteinIdentifications() const
non-mutable access to the protein identifications
void quantifyProteins(const ProteinIdentification &proteins=ProteinIdentification())
Compute protein abundances.
This class provides Input functionality for ConsensusMaps and Output functionality for alignments and...
Definition: ConsensusXMLFile.h:62
Used to load and store idXML files.
Definition: IdXMLFile.h:63
double getRT() const
returns the RT of the MS2 spectrum where the identification occurred
static void annotateQuantificationsToProteins(const ProteinQuant &protein_quants, ProteinIdentification &proteins, const UInt n_samples, bool remove_unquantified=true)
Annotate protein quant results as meta data to protein ids.
std::map< UInt64, ColumnHeader > ColumnHeaders
Definition: ConsensusMap.h:168
Bundles multiple (e.g. indistinguishable) proteins in a group.
Definition: ProteinIdentification.h:117
Size number_of_target_plus_decoy
Definition: ProteinResolver.h:123
std::map< AASequence, PeptideData > PeptideQuant
Mapping: peptide sequence (modified) -> peptide data.
Definition: PeptideAndProteinQuant.h:87
Representation of a peptide hit.
Definition: PeptideHit.h:55
Helper class for peptide and protein quantification based on feature data annotated with IDs.
Definition: PeptideAndProteinQuant.h:53
void resolveID(std::vector< PeptideIdentification > &peptide_identifications)
Computing protein groups from peptide identifications OR consensus map.