OpenMS
Loading...
Searching...
No Matches
PeptideAndProteinQuant.h
Go to the documentation of this file.
1// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin
2// SPDX-License-Identifier: BSD-3-Clause
3//
4// --------------------------------------------------------------------------
5// $Maintainer: Hendrik Weisser $
6// $Authors: Hendrik Weisser $
7// --------------------------------------------------------------------------
8
9#pragma once
10
18
19
20namespace OpenMS
21{
29 class OPENMS_DLLAPI PeptideAndProteinQuant :
31 {
32public:
33
35 typedef std::map<UInt64, double> SampleAbundances;
36
39 {
41 std::map<Int, std::map<String, std::map<Int, std::map<UInt, double>>>> abundances;
42
44 std::map<Int, std::map<String, std::map<Int, UInt64>>> psm_counts;
45
48
51
53 std::set<String> accessions;
54
56 Size psm_count = 0;
57
59 PeptideData() = default;
60 };
61
63 typedef std::map<AASequence, PeptideData> PeptideQuant;
64
67 {
69 std::map<String, SampleAbundances> peptide_abundances;
70
71 std::map<String, SampleAbundances> peptide_psm_counts;
72
74 std::map<String, std::map<UInt, double>> channel_level_abundances;
75
77 std::map<String, UInt64> file_level_psm_counts;
78
81
84
87
89 Size psm_count = 0;
90
92 ProteinData() = default;
93 };
94
96 typedef std::map<String, ProteinData> ProteinQuant;
97
100 {
103
106
109
111 Size quant_proteins, too_few_peptides;
112
114 Size quant_peptides, total_peptides;
115
117 Size quant_features, total_features, blank_features, ambig_features;
118
121 n_samples(0), quant_proteins(0), too_few_peptides(0),
122 quant_peptides(0), total_peptides(0), quant_features(0),
123 total_features(0), blank_features(0), ambig_features(0) {}
124 };
125
128
131
137 void readQuantData(FeatureMap& features, const ExperimentalDesign& ed);
138
144 void readQuantData(ConsensusMap& consensus, const ExperimentalDesign& ed);
145
151 void readQuantData(std::vector<ProteinIdentification>& proteins,
153 const ExperimentalDesign& ed);
154
166
167
176
177
178 std::map<OpenMS::String, OpenMS::String> mapAccessionToLeader(const OpenMS::ProteinIdentification& proteins) const;
179
182
185
188
191 const ProteinQuant& protein_quants,
192 ProteinIdentification& proteins,
193 bool remove_unquantified = true);
194
195private:
196
199
202
205
208
209
217
228 void quantifyFeature_(const FeatureHandle& feature,
229 size_t fraction,
230 const String& filename,
231 const PeptideHit& hit,
232 UInt channel_or_label);
233
242 const std::map<Int, std::map<String, std::map<Int, std::map<UInt, double>>>> & peptide_abundances,
243 std::tuple<size_t, String, size_t, UInt> & best);
244
250 template <typename T>
251 void orderBest_(const std::map<T, SampleAbundances> & abundances,
252 std::vector<T>& result)
253 {
254 typedef std::pair<Size, double> PairType;
255 std::multimap<PairType, T, std::greater<PairType> > order;
256 for (typename std::map<T, SampleAbundances>::const_iterator ab_it =
257 abundances.begin(); ab_it != abundances.end(); ++ab_it)
258 {
259 double total = 0.0;
260 for (SampleAbundances::const_iterator samp_it = ab_it->second.begin();
261 samp_it != ab_it->second.end(); ++samp_it)
262 {
263 total += samp_it->second;
264 }
265 if (total <= 0.0) continue; // not quantified
266 PairType key = std::make_pair(ab_it->second.size(), total);
267 order.insert(std::make_pair(key, ab_it->first));
268 }
269 result.clear();
270 for (typename std::multimap<PairType, T, std::greater<PairType> >::
271 iterator ord_it = order.begin(); ord_it != order.end(); ++ord_it)
272 {
273 result.push_back(ord_it->second);
274 }
275 }
276
277
278
283
292
301 std::vector<String> selectPeptidesForQuantification_(const String& protein_accession,
302 Size top_n,
303 bool fix_peptides);
304
312 double aggregateAbundances_(const std::vector<double>& abundances,
313 const String& method) const;
314
324 void calculateProteinAbundances_(const String& protein_accession,
325 const std::vector<String>& selected_peptides,
326 const String& aggregate_method,
327 Size top_n,
328 bool include_all);
329
341 const std::vector<String>& selected_peptides,
342 const String& aggregate_method,
343 Size top_n,
344 bool include_all,
345 const std::map<String, String>& accession_to_leader);
346
353
366 String getAccession_(const std::set<String>& pep_accessions,
367 const std::map<String, String>& accession_to_leader) const;
368
375
385 UInt channel_or_label,
386 const ExperimentalDesign& ed) const;
387
389 void updateMembers_() override;
390
391 }; // class
392
393} // namespace
A container for consensus elements.
Definition ConsensusMap.h:68
A base class for all classes handling default parameters.
Definition DefaultParamHandler.h:66
Representation of an experimental design in OpenMS. Instances can be loaded with the ExperimentalDesi...
Definition ExperimentalDesign.h:109
Representation of a Peak2D, RichPeak2D or Feature .
Definition FeatureHandle.h:36
A container for features.
Definition FeatureMap.h:82
Helper class for peptide and protein quantification based on feature data annotated with IDs.
Definition PeptideAndProteinQuant.h:31
void calculateFileAndChannelLevelProteinAbundances_(const String &protein_accession, const std::vector< String > &selected_peptides, const String &aggregate_method, Size top_n, bool include_all, const std::map< String, String > &accession_to_leader)
Calculate detailed protein abundances at channel level using selected peptides.
void readQuantData(ConsensusMap &consensus, const ExperimentalDesign &ed)
Read quantitative data from a consensus map.
void quantifyFeature_(const FeatureHandle &feature, size_t fraction, const String &filename, const PeptideHit &hit, UInt channel_or_label)
Gather quantitative information from a feature.
size_t getSampleIDFromFilenameAndChannel_(const String &filename, UInt channel_or_label, const ExperimentalDesign &ed) const
Map (filename, channel) to sample using ExperimentalDesign.
void annotateQuantificationsToProteins(const ProteinQuant &protein_quants, ProteinIdentification &proteins, bool remove_unquantified=true)
Annotate protein quant results as meta data to protein ids.
std::map< AASequence, PeptideData > PeptideQuant
Mapping: peptide sequence (modified) -> peptide data.
Definition PeptideAndProteinQuant.h:63
void readQuantData(FeatureMap &features, const ExperimentalDesign &ed)
Read quantitative data from a feature map.
std::map< String, ProteinData > ProteinQuant
Mapping: protein accession -> protein data.
Definition PeptideAndProteinQuant.h:96
ExperimentalDesign experimental_design_
Experimental design for filename/channel to sample mapping.
Definition PeptideAndProteinQuant.h:207
const PeptideQuant & getPeptideResults()
Get peptide abundance data.
void performIbaqNormalization_(const ProteinIdentification &proteins)
Perform iBAQ normalization on protein abundances.
void countPeptides_(PeptideIdentificationList &peptides)
Count the number of identifications (best hits only) of each peptide sequence.
void quantifyPeptides(const PeptideIdentificationList &peptides=PeptideIdentificationList())
Compute peptide abundances.
PeptideQuant pep_quant_
Peptide quantification data.
Definition PeptideAndProteinQuant.h:201
void transferPeptideDataToProteins_(const ProteinIdentification &proteins)
Transfer peptide-level quantitative data to protein-level data structures.
String getAccession_(const std::set< String > &pep_accessions, const std::map< String, String > &accession_to_leader) const
Get the "canonical" protein accession from the list of protein accessions of a peptide.
std::map< OpenMS::String, OpenMS::String > mapAccessionToLeader(const OpenMS::ProteinIdentification &proteins) const
~PeptideAndProteinQuant() override
Destructor.
Definition PeptideAndProteinQuant.h:130
void calculateProteinAbundances_(const String &protein_accession, const std::vector< String > &selected_peptides, const String &aggregate_method, Size top_n, bool include_all)
Calculate protein abundances for a single protein using selected peptides.
void readQuantData(std::vector< ProteinIdentification > &proteins, PeptideIdentificationList &peptides, const ExperimentalDesign &ed)
Read quantitative data from identification results (for quantification via spectral counting).
void updateMembers_() override
Clear all data when parameters are set.
double aggregateAbundances_(const std::vector< double > &abundances, const String &method) const
Aggregate abundances using the specified mathematical method.
const ProteinQuant & getProteinResults()
Get protein abundance data.
void normalizePeptides_()
Normalize peptide abundances across samples by (multiplicative) scaling to equal medians.
void quantifyProteins(const ProteinIdentification &proteins=ProteinIdentification())
Compute protein abundances.
Statistics stats_
Processing statistics for output in the end.
Definition PeptideAndProteinQuant.h:198
bool getBest_(const std::map< Int, std::map< String, std::map< Int, std::map< UInt, double > > > > &peptide_abundances, std::tuple< size_t, String, size_t, UInt > &best)
Determine fraction, filename, charge state, and channel of a peptide with the highest number of abund...
const Statistics & getStatistics()
Get summary statistics.
PeptideHit getAnnotation_(PeptideIdentificationList &peptides)
Get the "canonical" annotation (a single peptide hit) of a feature/consensus feature from the associa...
void orderBest_(const std::map< T, SampleAbundances > &abundances, std::vector< T > &result)
Order keys (charges/peptides for peptide/protein quantification) according to how many samples they a...
Definition PeptideAndProteinQuant.h:251
std::map< UInt64, double > SampleAbundances
Mapping: sample ID -> abundance.
Definition PeptideAndProteinQuant.h:35
ProteinQuant prot_quant_
Protein quantification data.
Definition PeptideAndProteinQuant.h:204
std::vector< String > selectPeptidesForQuantification_(const String &protein_accession, Size top_n, bool fix_peptides)
Select peptides for protein quantification based on filtering criteria.
PeptideAndProteinQuant()
Constructor.
Represents a single spectrum match (candidate) for a specific tandem mass spectrum (MS/MS).
Definition PeptideHit.h:52
Container for peptide identifications from multiple spectra.
Definition PeptideIdentificationList.h:66
Representation of a protein identification run.
Definition ProteinIdentification.h:54
A more convenient string class.
Definition String.h:34
int Int
Signed integer type.
Definition Types.h:72
unsigned int UInt
Unsigned integer type.
Definition Types.h:64
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition Types.h:97
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19
Quantitative and associated data for a peptide.
Definition PeptideAndProteinQuant.h:39
SampleAbundances total_psm_counts
spectral counting-based abundances
Definition PeptideAndProteinQuant.h:50
SampleAbundances total_abundances
mapping: sample -> total abundance
Definition PeptideAndProteinQuant.h:47
std::set< String > accessions
protein accessions for this peptide
Definition PeptideAndProteinQuant.h:53
std::map< Int, std::map< String, std::map< Int, UInt64 > > > psm_counts
mapping: fraction -> filename -> charge -> abundance
Definition PeptideAndProteinQuant.h:44
std::map< Int, std::map< String, std::map< Int, std::map< UInt, double > > > > abundances
mapping: fraction -> filename -> charge -> channel/label -> abundance
Definition PeptideAndProteinQuant.h:41
Quantitative and associated data for a protein.
Definition PeptideAndProteinQuant.h:67
SampleAbundances total_psm_counts
spectral counting-based abundances
Definition PeptideAndProteinQuant.h:83
SampleAbundances total_abundances
mapping: sample -> total abundance
Definition PeptideAndProteinQuant.h:80
std::map< String, std::map< UInt, double > > channel_level_abundances
mapping: filename -> channel/label -> abundance
Definition PeptideAndProteinQuant.h:74
std::map< String, UInt64 > file_level_psm_counts
mapping: filename -> PSM counts
Definition PeptideAndProteinQuant.h:77
std::map< String, SampleAbundances > peptide_psm_counts
Definition PeptideAndProteinQuant.h:71
std::map< String, SampleAbundances > peptide_abundances
mapping: peptide (unmodified) -> sample -> abundance
Definition PeptideAndProteinQuant.h:69
SampleAbundances total_distinct_peptides
number of distinct peptide sequences
Definition PeptideAndProteinQuant.h:86
Statistics for processing summary.
Definition PeptideAndProteinQuant.h:100
Size quant_proteins
protein statistics
Definition PeptideAndProteinQuant.h:111
Size quant_peptides
peptide statistics
Definition PeptideAndProteinQuant.h:114
Size n_samples
number of samples (or assays in mzTab terms)
Definition PeptideAndProteinQuant.h:102
Size n_fractions
number of fractions
Definition PeptideAndProteinQuant.h:105
Statistics()
constructor
Definition PeptideAndProteinQuant.h:120
Size n_ms_files
number of MS files
Definition PeptideAndProteinQuant.h:108
Size ambig_features
Definition PeptideAndProteinQuant.h:117