OpenMS
Loading...
Searching...
No Matches
XFDRAlgorithm.h
Go to the documentation of this file.
1// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin
2// SPDX-License-Identifier: BSD-3-Clause
3//
4// --------------------------------------------------------------------------
5// $Maintainer: Eugen Netz $
6// $Authors: Lukas Zimmermann, Eugen Netz $
7// --------------------------------------------------------------------------
8
9#pragma once
10
19
20namespace OpenMS
21{
22
23 //-------------------------------------------------------------
24 // Doxygen docu
25 //-------------------------------------------------------------
26
38 class OPENMS_DLLAPI XFDRAlgorithm :
40 {
41
42 public:
43
45 enum class ExitCodes
46 {
47 EXECUTION_OK,
48 ILLEGAL_PARAMETERS,
49 UNEXPECTED_RESULT
50 };
51
54
56 ~XFDRAlgorithm() override;
57
66
72
73private:
74 void updateMembers_() override;
75
86
92 static void assignTypes_(PeptideHit& pep_id, StringList& types);
93
105 void fdr_xprophet_(std::map< std::string, Math::Histogram<> >& cum_histograms,
106 const std::string& targetclass, const std::string& decoyclass, const std::string& fulldecoyclass,
107 std::vector< double >& fdr, bool mono) const;
108
114 static void calc_qfdr_(const std::vector< double >& fdr, std::vector< double >& qfdr);
115
117
118 void writeArgumentsLog_() const;
119
120 std::string getId_(const PeptideHit& ph) const;
121
123 {
124 Size alpha_ions = Size(ph.getMetaValue("matched_linear_alpha")) + Size(ph.getMetaValue("matched_xlink_alpha"));
125 Size beta_ions = Size(ph.getMetaValue("matched_linear_beta")) + Size(ph.getMetaValue("matched_xlink_beta"));
126 return std::min(alpha_ions, beta_ions);
127 }
128
129 inline static void setIntraProtein_(PeptideHit& ph, const bool value)
130 {
131 ph.setMetaValue("XFDR:is_intraprotein", DataValue(value ? "true" : "false"));
132 }
133
134 inline static void setInterProtein_(PeptideHit& ph, const bool value)
135 {
136 ph.setMetaValue("XFDR:is_interprotein", DataValue(value ? "true" : "false"));
137 }
138
142 static bool isSameProtein_(
143 std::string prot1,
144 std::string prot2,
145 const std::string &decoy_string)
146 {
147 StringUtils::substitute(prot1, decoy_string, "");
148 StringUtils::substitute(prot2, decoy_string, "");
149 assert( ! StringUtils::hasSubstring(prot1, decoy_string));
150 assert( ! StringUtils::hasSubstring(prot2, decoy_string));
151 return prot1 == prot2;
152 }
153
154 // Score range for this of the tool
157
158 // unique top hits
159 std::vector<std::string> unique_ids_;
160 std::vector<double> unique_id_scores_;
161
162 // maps index of peptide id all_pep_ids_ to vector of cross link class
163 std::map<std::string, std::vector<std::string>> cross_link_classes_;
164
165 // Program arguments
166 std::string decoy_string_;
175
176 // Names of the class parameters
177 static const std::string param_decoy_string_;
178 static const std::string param_minborder_;
179 static const std::string param_maxborder_;
180 static const std::string param_mindeltas_;
181 static const std::string param_minionsmatched_;
182 static const std::string param_uniquexl_;
183 static const std::string param_no_qvalues_;
184 static const std::string param_minscore_;
185 static const std::string param_binsize_;
186
187 // Constants related to particular crosslink classes
188 static const std::string crosslink_class_intradecoys_;
190 static const std::string crosslink_class_interdecoys_;
192 static const std::string crosslink_class_monodecoys_;
193 static const std::string crosslink_class_intralinks_;
194 static const std::string crosslink_class_interlinks_;
195 static const std::string crosslink_class_monolinks_;
196 static const std::string crosslink_class_decoys_;
197 static const std::string crosslink_class_targets_;
200 };
201}
Class to hold strings, numeric values, lists of strings and lists of numeric values.
Definition DataValue.h:32
A base class for all classes handling default parameters.
Definition DefaultParamHandler.h:66
Representation of a histogram.
Definition Histogram.h:38
const DataValue & getMetaValue(const std::string &name) const
Returns the value corresponding to a string, or DataValue::EMPTY if not found.
void setMetaValue(const std::string &name, const DataValue &value)
Sets the DataValue corresponding to a name.
Represents a single spectrum match (candidate) for a specific tandem mass spectrum (MS/MS).
Definition PeptideHit.h:52
Container for peptide identifications from multiple spectra.
Definition PeptideIdentificationList.h:66
Base class for all classes that want to report their progress.
Definition ProgressLogger.h:27
Representation of a protein identification run.
Definition ProteinIdentification.h:55
Calculates false discovery rate estimates on crosslink identifications.
Definition XFDRAlgorithm.h:40
static const std::string crosslink_class_targets_
Definition XFDRAlgorithm.h:197
ExitCodes validateClassArguments() const
Checks whether the parameters of the object are valid.
bool arg_no_qvalues_
Definition XFDRAlgorithm.h:173
static const std::string param_mindeltas_
Definition XFDRAlgorithm.h:180
static const std::string crosslink_class_hybriddecoysintralinks_
Definition XFDRAlgorithm.h:198
static const std::string param_maxborder_
Definition XFDRAlgorithm.h:179
std::string getId_(const PeptideHit &ph) const
static void setIntraProtein_(PeptideHit &ph, const bool value)
Definition XFDRAlgorithm.h:129
static const std::string crosslink_class_hybriddecoysinterlinks_
Definition XFDRAlgorithm.h:199
static const std::string crosslink_class_interdecoys_
Definition XFDRAlgorithm.h:190
static void calc_qfdr_(const std::vector< double > &fdr, std::vector< double > &qfdr)
Calculates the qFDR values for the provided FDR values, assuming that the FDRs are sorted by score in...
static const std::string crosslink_class_decoys_
Definition XFDRAlgorithm.h:196
static const std::string crosslink_class_fulldecoysinterlinks_
Definition XFDRAlgorithm.h:191
static const std::string crosslink_class_fulldecoysintralinks_
Definition XFDRAlgorithm.h:189
void findTopUniqueHits_(PeptideIdentificationList &peptide_ids)
ExitCodes run(PeptideIdentificationList &peptide_ids, ProteinIdentification &protein_id)
Performs the main function of this class, the FDR estimation for cross-linked peptide experiments.
static const std::string param_minborder_
Definition XFDRAlgorithm.h:178
bool arg_uniquex_
Definition XFDRAlgorithm.h:172
double arg_minscore_
Definition XFDRAlgorithm.h:171
static const std::string crosslink_class_monolinks_
Definition XFDRAlgorithm.h:195
XFDRAlgorithm()
Default constructor.
static const std::string crosslink_class_intradecoys_
Definition XFDRAlgorithm.h:188
static const std::string crosslink_class_monodecoys_
Definition XFDRAlgorithm.h:192
static const std::string crosslink_class_intralinks_
Definition XFDRAlgorithm.h:193
double arg_mindeltas_
Definition XFDRAlgorithm.h:167
static const std::string crosslink_class_interlinks_
Definition XFDRAlgorithm.h:194
static const std::string param_uniquexl_
Definition XFDRAlgorithm.h:182
void initDataStructures_(PeptideIdentificationList &peptide_ids, ProteinIdentification &protein_id)
Prepares vector of PeptideIdentification such that it can be processed downstream....
static const std::string param_minionsmatched_
Definition XFDRAlgorithm.h:181
static const std::string param_binsize_
Definition XFDRAlgorithm.h:185
Int min_score_
Definition XFDRAlgorithm.h:155
std::vector< double > unique_id_scores_
Definition XFDRAlgorithm.h:160
void writeArgumentsLog_() const
static bool isSameProtein_(std::string prot1, std::string prot2, const std::string &decoy_string)
Determines whether the Peptide Evidences belong to the same protein, modulo decoy.
Definition XFDRAlgorithm.h:142
static Size getMinIonsMatched_(const PeptideHit &ph)
Definition XFDRAlgorithm.h:122
Int max_score_
Definition XFDRAlgorithm.h:156
static const std::string param_decoy_string_
Definition XFDRAlgorithm.h:177
static const std::string param_minscore_
Definition XFDRAlgorithm.h:184
static void setInterProtein_(PeptideHit &ph, const bool value)
Definition XFDRAlgorithm.h:134
void fdr_xprophet_(std::map< std::string, Math::Histogram<> > &cum_histograms, const std::string &targetclass, const std::string &decoyclass, const std::string &fulldecoyclass, std::vector< double > &fdr, bool mono) const
xprophet method for target hits counting as implemented in xProphet
void updateMembers_() override
This method is used to update extra member variables at the end of the setParameters() method.
std::vector< std::string > unique_ids_
Definition XFDRAlgorithm.h:159
ExitCodes
Exit codes.
Definition XFDRAlgorithm.h:46
static void assignTypes_(PeptideHit &pep_id, StringList &types)
Inspects a PeptideIdentification and assigns all cross-link types that this identification belongs to...
std::map< std::string, std::vector< std::string > > cross_link_classes_
Definition XFDRAlgorithm.h:163
double arg_minborder_
Definition XFDRAlgorithm.h:168
double arg_maxborder_
Definition XFDRAlgorithm.h:169
Int arg_minionsmatched_
Definition XFDRAlgorithm.h:170
std::string decoy_string_
Definition XFDRAlgorithm.h:166
double arg_binsize_
Definition XFDRAlgorithm.h:174
~XFDRAlgorithm() override
Default destructor.
static const std::string param_no_qvalues_
Definition XFDRAlgorithm.h:183
int Int
Signed integer type.
Definition Types.h:72
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition Types.h:97
std::vector< std::string > StringList
Vector of String.
Definition ListUtils.h:44
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19