|
OpenMS
2.5.0
|
Go to the documentation of this file.
87 enum type {primary, secondary, primary_indistinguishable, secondary_indistinguishable} protein_type;
91 std::list<ProteinEntry *>
indis;
144 enum type {PeptideIdent, Consensus} input_type;
165 void resolveID(std::vector<PeptideIdentification> & peptide_identifications);
219 void countTargetDecoy(std::vector<MSDGroup> & msd_groups,
ConsensusMap & consensus);
227 void countTargetDecoy(std::vector<MSDGroup> & msd_groups, std::vector<PeptideIdentification> & peptide_nodes);
231 void setProteinData(std::vector<FASTAFile::FASTAEntry> & protein_data);
233 const std::vector<ResolverResult> & getResults();
239 static const PeptideHit & getPeptideHit(
const std::vector<PeptideIdentification> & peptide_nodes,
const PeptideEntry * peptide);
246 void computeIntensityOfMSD_(std::vector<MSDGroup> & msd_groups);
252 Size findPeptideEntry_(
String seq, std::vector<PeptideEntry> & nodes);
254 Size binarySearchNodes_(
String & seq, std::vector<PeptideEntry> & nodes,
Size start,
Size end);
256 Size includeMSMSPeptides_(std::vector<PeptideIdentification> & peptide_identifications, std::vector<PeptideEntry> & peptide_nodes);
259 Size includeMSMSPeptides_(
ConsensusMap & consensus, std::vector<PeptideEntry> & peptide_nodes);
261 void reindexingNodes_(std::vector<MSDGroup> & msd_groups, std::vector<Size> & reindexed_proteins, std::vector<Size> & reindexed_peptides);
263 void primaryProteins_(std::vector<PeptideEntry> & peptide_nodes, std::vector<Size> & reindexed_peptides);
264 void buildingMSDGroups_(std::vector<MSDGroup> & msd_groups, std::vector<ISDGroup> & isd_groups);
265 void buildingISDGroups_(std::vector<ProteinEntry> & protein_nodes, std::vector<PeptideEntry> & peptide_nodes,
266 std::vector<ISDGroup> & isd_groups);
std::vector< MSDGroup > * msds
Definition: ProteinResolver.h:139
std::map< AASequence, PeptideData > PeptideQuant
Mapping: peptide sequence (modified) -> peptide data.
Definition: PeptideAndProteinQuant.h:82
std::list< ProteinEntry * > indis
Definition: ProteinResolver.h:91
Stream class for writing to comma/tab/...-separated values files.
Definition: SVOutStream.h:54
Management and storage of parameters / INI files.
Definition: Param.h:73
void resolveID(std::vector< PeptideIdentification > &peptide_identifications)
Computing protein groups from peptide identifications OR consensus map.
Resolves shared peptides based on protein scores.
Definition: PeptideProteinResolution.h:86
void quantifyProteins(const ProteinIdentification &proteins=ProteinIdentification())
Compute protein abundances.
FASTAFile::FASTAEntry * fasta_entry
Definition: ProteinResolver.h:86
This class provides Input/Output functionality for feature maps.
Definition: FeatureXMLFile.h:68
float intensity
Definition: ProteinResolver.h:110
Size number_of_target
Definition: ProteinResolver.h:122
Size index
Definition: ProteinResolver.h:119
Int getCharge() const
returns the charge of the peptide
const Param & getParameters() const
Non-mutable access to the parameters.
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
OpenMS identification format (.idXML)
Definition: FileTypes.h:66
Size peptide_hit
Definition: ProteinResolver.h:105
bool experimental
Definition: ProteinResolver.h:109
std::list< PeptideEntry * > peptides
Definition: ProteinResolver.h:118
This class provides some basic file handling methods for text files.
Definition: TextFile.h:46
static String concatenate(const std::vector< T > &container, const String &glue="")
Concatenates all elements of the container and puts the glue string between elements.
Definition: ListUtils.h:193
type
Definition: ProteinResolver.h:144
static void load(const String &filename, std::vector< FASTAEntry > &data)
loads a FASTA file given by 'filename' and stores the information in 'data'
void setProteinIdentifications(const std::vector< ProteinIdentification > &protein_identifications)
sets the protein identifications
#define OPENMS_LOG_INFO
Macro if a information, e.g. a status should be reported.
Definition: LogStream.h:465
std::vector< ResolverResult > resolver_result_
Definition: ProteinResolver.h:243
Size number_of_decoy
Definition: ProteinResolver.h:121
double weight
Definition: ProteinResolver.h:88
void readQuantData(FeatureMap &features, const ExperimentalDesign &ed)
Read quantitative data from a feature map.
Definition: ProteinResolver.h:127
represents a peptide. First in silico. If experimental is set to true it is MS/MS derived.
Definition: ProteinResolver.h:99
representation of an msd group. Contains peptides, proteins and a pointer to its ISD group
Definition: ProteinResolver.h:115
Size isd_group
Definition: ProteinResolver.h:108
bool traversed
Definition: ProteinResolver.h:85
Representation of a protein identification run.
Definition: ProteinIdentification.h:71
void load(const String &filename, FeatureMap &feature_map)
loads the file with name filename into map and calls updateRanges().
Size msd_group
Definition: ProteinResolver.h:107
Merge files according to experimental design.
Definition: QuantitativeExperimentalDesign.h:56
Definition: ProteinResolver.h:144
Size n_samples
number of samples (or assays in mzTab terms)
Definition: PeptideAndProteinQuant.h:108
const AASequence & getSequence() const
returns the peptide sequence without trailing or following spaces
std::vector< PeptideIdentification > * peptide_identification
Definition: ProteinResolver.h:145
void load(const String &filename, std::vector< ProteinIdentification > &protein_ids, std::vector< PeptideIdentification > &peptide_ids)
Loads the identifications of an idXML file without identifier.
std::vector< PeptideEntry > * peptide_entries
Definition: ProteinResolver.h:141
String toString() const
returns the peptide as string with modifications embedded in brackets
std::map< String, ProteinData > ProteinQuant
Mapping: protein accession -> protein data.
Definition: PeptideAndProteinQuant.h:102
Exception indicating that an invalid parameter was handed over to an algorithm.
Definition: Exception.h:347
Log Stream Class.
Definition: LogStream.h:311
A container for features.
Definition: FeatureMap.h:95
std::vector< FASTAFile::FASTAEntry > protein_data_
Definition: ProteinResolver.h:244
Size number_of_experimental_peptides
Definition: ProteinResolver.h:95
static const PeptideHit & getPeptideHit(const ConsensusMap &consensus, const PeptideEntry *peptide)
static ExperimentalDesign fromConsensusMap(const ConsensusMap &c)
Extract experimental design from consensus map.
represents a protein from FASTA file
Definition: ProteinResolver.h:82
const std::vector< ProteinGroup > & getIndistinguishableProteins() const
Returns the indistinguishable proteins.
Statistics for processing summary.
Definition: PeptideAndProteinQuant.h:105
Base class for TOPP applications.
Definition: TOPPBase.h:144
Definition: ProteinResolver.h:135
std::vector< String > StringList
Vector of String.
Definition: ListUtils.h:70
std::vector< ISDGroup > * isds
Definition: ProteinResolver.h:138
This class provides Input functionality for ConsensusMaps and Output functionality for alignments and...
Definition: ConsensusXMLFile.h:61
const std::vector< ProteinIdentification > & getProteinIdentifications() const
non-mutable access to the protein identifications
String origin
Definition: ProteinResolver.h:111
const DataValue & getValue(const String &key) const
Returns a value of a parameter.
bool modifyStrings(bool modify)
Switch modification of strings (quoting/replacing of separators) on/off.
Not all required information provided.
Definition: Exception.h:195
std::vector< Size > * reindexed_proteins
Definition: ProteinResolver.h:143
const PeptideQuant & getPeptideResults()
Get peptide abundance data.
std::vector< Size > * reindexed_peptides
Definition: ProteinResolver.h:142
Helper class for peptide and protein quantification based on feature data annotated with IDs.
Definition: ProteinResolver.h:56
void resolveConsensus(ConsensusMap &consensus)
Computing protein groups from peptide identifications OR consensus map.
double getMonoWeight(Residue::ResidueType type=Residue::Full, Int charge=0) const
Representation of a peptide/protein sequence.
Definition: AASequence.h:113
File adapter for MzTab files.
Definition: MzTabFile.h:58
String sequence
Definition: ProteinResolver.h:103
String toUnmodifiedString() const
returns the peptide as string without any modifications or (e.g., "PEPTIDER")
std::list< ProteinEntry * > proteins
Definition: ProteinResolver.h:117
String identifier
Definition: ProteinResolver.h:137
const ColumnHeaders & getColumnHeaders() const
Non-mutable access to the file descriptions.
const std::vector< PeptideHit > & getHits() const
returns the peptide hits as const
A container for consensus elements.
Definition: ConsensusMap.h:79
Size isd_group
Definition: ProteinResolver.h:94
std::vector< ProteinEntry > * protein_entries
Definition: ProteinResolver.h:140
void setParameters(const Param ¶m)
Sets the parameters.
void load(const String &filename, bool trim_lines=false, Int first_n=-1, bool skip_empty_lines=false)
Loads data from a text file.
static FileTypes::Type getType(const String &filename)
Tries to determine the file type (by name or content)
Size msd_group
Definition: ProteinResolver.h:93
bool update(const Param &p_outdated, const bool add_unknown=false)
Rescue parameter values from p_outdated to current param.
Bundles multiple (e.g. indistinguishable) proteins in a group.
Definition: ProteinIdentification.h:81
Data model of MzTab files. Please see the official MzTab specification at https://code....
Definition: MzTab.h:855
FASTA entry type (identifier, description and sequence)
Definition: FASTAFile.h:76
ISDGroup * isd_group
Definition: ProteinResolver.h:120
float coverage
Definition: ProteinResolver.h:89
OpenMS feature file (.featureXML)
Definition: FileTypes.h:65
void load(const String &filename, ConsensusMap &map)
Loads a consensus map from file and calls updateRanges.
double getMZ() const
returns the MZ of the MS2 spectrum
void setProteinData(std::vector< FASTAFile::FASTAEntry > &protein_data)
void quantifyPeptides(const std::vector< PeptideIdentification > &peptides=std::vector< PeptideIdentification >())
Compute peptide abundances.
type
Definition: ProteinResolver.h:87
Represents the peptide hits for a spectrum.
Definition: PeptideIdentification.h:62
A base class for all classes handling default parameters.
Definition: DefaultParamHandler.h:91
static MzTab exportConsensusMapToMzTab(const ConsensusMap &consensus_map, const String &filename, const bool first_run_inference_only, const bool export_unidentified_features, const bool export_unassigned_ids, const bool export_subfeatures, const bool export_empty_pep_ids=false, const String &title="ConsensusMap export from OpenMS")
export linked peptide features aka consensus map
Size index
Definition: ProteinResolver.h:92
ConsensusMap * consensus_map
Definition: ProteinResolver.h:146
Type
Actual file types enum.
Definition: FileTypes.h:58
const std::vector< ProteinHit > & getHits() const
Returns the protein hits.
QString toQString() const
Conversion to Qt QString.
static const PeptideIdentification & getPeptideIdentification(const ConsensusMap &consensus, const PeptideEntry *peptide)
overloaded functions – return a const reference to a PeptideIdentification object or a peptideHit eit...
Used to load and store idXML files.
Definition: IdXMLFile.h:63
Size number_of_target_plus_decoy
Definition: ProteinResolver.h:123
double getScore() const
returns the PSM score
std::list< PeptideEntry * > peptides
Definition: ProteinResolver.h:84
const std::vector< ResolverResult > & getResults()
std::list< Size > msd_groups
Definition: ProteinResolver.h:132
A more convenient string class.
Definition: String.h:58
Representation of a peptide hit.
Definition: PeptideHit.h:54
double getRT() const
returns the RT of the MS2 spectrum where the identification occurred
Helper class for peptide and protein quantification based on feature data annotated with IDs.
Definition: PeptideAndProteinQuant.h:53
QuotingMethod
How to handle embedded quotes when quoting strings.
Definition: String.h:81
Representation of the Experimental Design in OpenMS. Instances can be loaded via the ExperimentalDesi...
Definition: ExperimentalDesign.h:85
static ExperimentalDesign fromFeatureMap(const FeatureMap &f)
Extract experimental design from feature map.
std::vector< ProteinHit >::iterator findHit(const String &accession)
Finds a protein hit by accession (returns past-the-end iterator if not found)
bool traversed
Definition: ProteinResolver.h:102
const ProteinQuant & getProteinResults()
Get protein abundance data.
unsigned getNumberOfSamples() const
static ExperimentalDesign fromIdentifications(const std::vector< ProteinIdentification > &proteins)
Extract experimental design from identifications.
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:46
const Statistics & getStatistics()
Get summary statistics.
const std::vector< ProteinIdentification > & getProteinIdentifications() const
non-mutable access to the protein identifications
A required parameter was not given.
Definition: TOPPBase.h:111
void buildGraph(ProteinIdentification &protein, const std::vector< PeptideIdentification > &peptides, bool skip_sort=false)
String & substitute(char from, char to)
Replaces all occurrences of the character from by the character to.
Size peptide_identification
Definition: ProteinResolver.h:104
void applyDesign2Resolver(ProteinResolver &resolver, TextFile &file, StringList &fileNames)
xxxxxxx
static void annotateQuantificationsToProteins(const ProteinQuant &protein_quants, ProteinIdentification &proteins, const UInt n_samples)
Annotate protein quant results as meta data to protein ids.
std::map< UInt64, double > SampleAbundances
Mapping: sample ID -> abundance.
Definition: PeptideAndProteinQuant.h:59
std::map< UInt64, ColumnHeader > ColumnHeaders
Definition: ConsensusMap.h:158
This class serves for reading in and writing FASTA files.
Definition: FASTAFile.h:64
int main(int argc, const char **argv)
Definition: INIFileEditor.cpp:73
enum OpenMS::ProteinResolver::ResolverResult::type input_type
void store(const String &filename, const MzTab &mz_tab) const
static ExperimentalDesign load(const String &tsv_file, bool require_spectra_files)
Loads an experimental design from a tabular separated file.
String identifier
Definition: FASTAFile.h:78