OpenMS
ConsensusIDAlgorithm.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2023.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Hendrik Weisser $
32 // $Authors: Andreas Bertsch, Marc Sturm, Sven Nahnsen, Hendrik Weisser $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
39 #include <map>
40 #include <vector>
41 
42 namespace OpenMS
43 {
/// Abstract base class for all ConsensusID algorithms (that calculate a
/// consensus from multiple ID runs). Subclasses supply the actual consensus
/// computation by implementing the pure virtual apply_().
///
/// NOTE(review): this listing is incomplete. The symbol index for this header
/// also names a default constructor, an overriding destructor, deleted copy
/// constructor/assignment, and the members considered_hits_, number_of_runs_,
/// count_empty_ and keep_old_scores_, none of which appear below -- consult
/// the real header before relying on this declaration.
59  class OPENMS_DLLAPI ConsensusIDAlgorithm : public DefaultParamHandler
60  {
61  public:
    /// Calculates the consensus ID for a set of peptide identifications of one
    /// spectrum or (consensus) feature.
    /// @param ids Peptide identifications; taken by non-const reference
    ///        (presumably replaced by the consensus result -- TODO confirm).
    /// @param se_info String-to-string map that is also handed to apply_()
    ///        (presumably search-engine information -- TODO confirm).
    /// @param number_of_runs Number of ID runs; defaults to 0 (the meaning of
    ///        0 is not visible here -- TODO confirm).
72  void apply(std::vector<PeptideIdentification>& ids, const std::map<String, String>& se_info, Size number_of_runs = 0);
73 
    /// Overload of apply() that takes no se_info map.
74  void apply(std::vector<PeptideIdentification>& ids, Size number_of_runs = 0);
75 
78 
79  protected:
    /// Per-sequence record; used as the mapped type of SequenceGrouping.
    /// NOTE(review): the index also lists `Int charge` (line 81) and
    /// `String target_decoy` (line 86) as members; they are missing here.
80  struct HitInfo {
    // Collected scores for the sequence
    // (presumably one entry per contributing hit -- TODO confirm).
82  std::vector<double> scores;
    // String labels stored alongside the scores
    // (presumably the score types -- TODO confirm).
83  std::vector<String> types;
84  // in case too much information is stored, TD and evidence
85  // could be re-annotated with PeptideIndexer later
87  std::set<PeptideEvidence> evidence;
    // Final (consensus) score of the sequence; how it is computed is not shown here.
88  double final_score;
    // Support value of the sequence (presumably related to min_support_ -- TODO confirm).
89  double support;
90  // TODO: we could gather spectrum_refs here as well,
91  // to support passing of spectrum_ref if ALL refs of a group are the same
92  // For now, we do it in the ConsensusID TOPP tool class in cases where we
93  // know that refs will be the same.
94  };
95 
    /// Mapping: peptide sequence -> (charge, scores)
97  typedef std::map<AASequence, HitInfo> SequenceGrouping;
98 
101 
104 
    /// Fraction of required support by other ID runs (input parameter)
106  double min_support_;
107 
110 
113 
116 
    /// Consensus computation (to be implemented by subclasses).
    /// @param ids Peptide identifications to process.
    /// @param se_info String-to-string map, as passed to apply().
    /// @param results Sequence grouping taken by non-const reference
    ///        (presumably the output of the computation -- TODO confirm).
124  virtual void apply_(std::vector<PeptideIdentification>& ids, const std::map<String, String>& se_info, SequenceGrouping& results) = 0;
125 
    /// Overrides the base-class hook; documented in the base class.
127  void updateMembers_() override;
128 
    /// Compare (and possibly update) charge state information.
    /// @param recorded_charge Charge recorded so far; non-const reference, so it may be updated.
    /// @param new_charge Charge to compare against the recorded one.
    /// @param peptide Peptide sequence the charges refer to.
130  void compareChargeStates_(Int& recorded_charge, Int new_charge, const AASequence& peptide);
131 
132  private:
    // NOTE(review): nothing is listed in this section; presumably the deleted
    // ("Not implemented.") copy constructor and assignment operator named in
    // the index belong here -- TODO confirm.
135 
138  };
139 
140 } // namespace OpenMS
Representation of a peptide/protein sequence.
Definition: AASequence.h:112
Abstract base class for all ConsensusID algorithms (that calculate a consensus from multiple ID runs)...
Definition: ConsensusIDAlgorithm.h:60
void compareChargeStates_(Int &recorded_charge, Int new_charge, const AASequence &peptide)
Compare (and possibly update) charge state information.
Size considered_hits_
Number of peptide hits considered per ID run (input parameter)
Definition: ConsensusIDAlgorithm.h:100
std::set< PeptideEvidence > evidence
Definition: ConsensusIDAlgorithm.h:87
double support
Definition: ConsensusIDAlgorithm.h:89
String target_decoy
Definition: ConsensusIDAlgorithm.h:86
std::vector< double > scores
Definition: ConsensusIDAlgorithm.h:82
Size number_of_runs_
Number of ID runs.
Definition: ConsensusIDAlgorithm.h:103
double min_support_
Fraction of required support by other ID runs (input parameter)
Definition: ConsensusIDAlgorithm.h:106
bool count_empty_
Count empty runs in "min_support" calculation? (input parameter)
Definition: ConsensusIDAlgorithm.h:109
Int charge
Definition: ConsensusIDAlgorithm.h:81
std::map< AASequence, HitInfo > SequenceGrouping
Mapping: peptide sequence -> (charge, scores)
Definition: ConsensusIDAlgorithm.h:97
bool keep_old_scores_
Keep old scores?
Definition: ConsensusIDAlgorithm.h:112
ConsensusIDAlgorithm()
Default constructor.
double final_score
Definition: ConsensusIDAlgorithm.h:88
virtual void apply_(std::vector< PeptideIdentification > &ids, const std::map< String, String > &se_info, SequenceGrouping &results)=0
Consensus computation (to be implemented by subclasses).
void apply(std::vector< PeptideIdentification > &ids, Size number_of_runs=0)
void updateMembers_() override
Docu in base class.
ConsensusIDAlgorithm(const ConsensusIDAlgorithm &)=delete
Not implemented.
std::vector< String > types
Definition: ConsensusIDAlgorithm.h:83
void apply(std::vector< PeptideIdentification > &ids, const std::map< String, String > &se_info, Size number_of_runs=0)
Calculates the consensus ID for a set of peptide identifications of one spectrum or (consensus) feature.
ConsensusIDAlgorithm & operator=(const ConsensusIDAlgorithm &)=delete
Not implemented.
~ConsensusIDAlgorithm() override
Virtual destructor.
Definition: ConsensusIDAlgorithm.h:80
A base class for all classes handling default parameters.
Definition: DefaultParamHandler.h:92
A more convenient string class.
Definition: String.h:60
int Int
Signed integer type.
Definition: Types.h:102
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:48