OpenMS  2.7.0
MRMAssay.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2021.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: George Rosenberger $
32 // $Authors: George Rosenberger $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
42 
43 #include <boost/bind.hpp>
44 #include <boost/lexical_cast.hpp>
45 #include <boost/random/mersenne_twister.hpp>
46 #include <boost/random/uniform_int.hpp>
47 #include <boost/random/variate_generator.hpp>
48 
49 // #define DEBUG_MRMASSAY
50 
51 namespace OpenMS
52 {
// MRMAssay: generates assays from a TargetedExperiment. Derives from
// ProgressLogger (the base class for classes that report their progress).
//
// NOTE(review): this listing appears to have lost its documentation comments
// and the opening line of several multi-line declarations during extraction.
// Each such gap is marked below, naming the member whose signature in the
// member index that follows the listing matches the surviving parameter list.
68  class OPENMS_DLLAPI MRMAssay :
69  public ProgressLogger
70  {
71 
72 public:
// Default constructor.
74  MRMAssay(); // empty, no members
// NOTE(review): the member index also lists a destructor ~MRMAssay(), which is
// not visible in this listing; presumably it was dropped around here. Confirm
// against the original header.
76 
80 
// Container aliases for the elements of a TargetedExperiment and for
// ReactionMonitoringTransition objects.
81  typedef std::vector<OpenMS::TargetedExperiment::Protein> ProteinVectorType;
82  typedef std::vector<OpenMS::TargetedExperiment::Peptide> PeptideVectorType;
83  typedef std::vector<OpenMS::TargetedExperiment::Compound> CompoundVectorType;
84  typedef std::vector<OpenMS::ReactionMonitoringTransition> TransitionVectorType;
85 
// Maps from a String key to pointers to const transitions.
// NOTE(review): presumably keyed by peptide id / compound id respectively; the
// key meaning is not shown here. Confirm against the implementation.
86  typedef std::map<String, std::vector<const ReactionMonitoringTransition*> > PeptideTransitionMapType;
87  typedef std::map<String, std::vector<const ReactionMonitoringTransition*> > CompoundTransitionMapType;
88 
// ModifiedSequenceMap: maps an unmodified sequence to all its modified sequences.
89  typedef boost::unordered_map<String, std::set<std::string> > ModifiedSequenceMap;
// SequenceMapT: stores the ModifiedSequenceMap for all SWATH windows.
90  typedef boost::unordered_map<size_t, ModifiedSequenceMap> SequenceMapT;
91 
// FragmentSeqMap: fragment sequence map of "fragment m/z" -> "modified sequence".
92  typedef std::vector<std::pair<double, std::string> > FragmentSeqMap;
// IonMapT: stores a mapping "unmodified sequence" -> FragmentSeqMap for all SWATH windows.
93  typedef boost::unordered_map<size_t, boost::unordered_map<String, FragmentSeqMap > > IonMapT;
94 
// IonSeries: an ion series of "ion_type" -> "fragment m/z".
95  typedef std::vector<std::pair<std::string, double> > IonSeries;
// PeptideMapT: maps a peptide sequence to its ion series.
96  typedef std::map<String, IonSeries > PeptideMapT;
97 
// TargetDecoyMapT: maps the peptide id (same for target and decoy) to the decoy peptide object.
98  typedef boost::unordered_map<String, TargetedExperiment::Peptide> TargetDecoyMapT;
99 
// reannotateTransitions: annotates and filters transitions in a TargetedExperiment.
// NOTE(review): the opening line of this declaration
// (`void reannotateTransitions(OpenMS::TargetedExperiment& exp,` per the member
// index) is missing from the listing; only the remaining parameters survive.
114  double precursor_mz_threshold,
115  double product_mz_threshold,
116  const std::vector<String>& fragment_types,
117  const std::vector<size_t>& fragment_charges,
118  bool enable_specific_losses,
119  bool enable_unspecific_losses,
120  int round_decPow = -4);
121 
// restrictTransitions: restricts and filters transitions in a TargetedExperiment.
// NOTE(review): the opening line
// (`void restrictTransitions(OpenMS::TargetedExperiment& exp,` per the member
// index) is missing from the listing.
133  double lower_mz_limit, double upper_mz_limit,
134  const std::vector<std::pair<double, double> >& swathes);
135 
// detectingTransitions: selects detecting fragment ions. Takes the experiment
// by non-const reference together with minimum and maximum transition counts.
144  void detectingTransitions(OpenMS::TargetedExperiment& exp, int min_transitions, int max_transitions);
145 
// uisTransitions: annotates UIS / site-specific transitions.
// NOTE(review): the opening line
// (`void uisTransitions(OpenMS::TargetedExperiment& exp,` per the member index)
// is missing from the listing. The last four parameters carry defaults.
180  const std::vector<String>& fragment_types,
181  const std::vector<size_t>& fragment_charges,
182  bool enable_specific_losses,
183  bool enable_unspecific_losses,
184  bool enable_ms2_precursors,
185  double mz_threshold,
186  const std::vector<std::pair<double, double> >& swathes,
187  int round_decPow = -4,
188  size_t max_num_alternative_localizations = 20,
189  int shuffle_seed = -1,
190  bool disable_decoy_transitions = false);
191 
// filterMinMaxTransitionsCompound: filters target and decoy transitions by
// intensity, only keeping the top N transitions.
200  void filterMinMaxTransitionsCompound(OpenMS::TargetedExperiment& exp, int min_transitions, int max_transitions);
201 
// NOTE(review): the member index also lists
// `void filterUnreferencedDecoysCompound(OpenMS::TargetedExperiment& exp)`,
// which is not visible in this listing; presumably it was dropped around here.
216 
217 protected:
218 
// getMatchingPeptidoforms_: checks a fragment ion against the entries of `ions`
// within `mz_threshold` and returns the matching peptidoforms as strings.
228  std::vector<std::string> getMatchingPeptidoforms_(const double fragment_ion,
229  const FragmentSeqMap& ions,
230  const double mz_threshold);
231 
// getSwath_: gets the swath index (precursor isolation window ordinal) for a
// particular precursor m/z.
240  int getSwath_(const std::vector<std::pair<double, double> >& swathes, const double precursor_mz);
241 
// isInSwath_: checks whether the product m/z of a transition falls into the
// precursor isolation window.
251  bool isInSwath_(const std::vector<std::pair<double, double> >& swathes, const double precursor_mz, const double product_mz);
252 
// getRandomSequence_: generates a random peptide sequence of `sequence_size`.
// The generator wrapper is taken by value; it wraps a reference to a
// boost::mt19937 engine (see the template arguments).
261  std::string getRandomSequence_(size_t sequence_size, boost::variate_generator<boost::mt19937&, boost::uniform_int<> > pseudoRNG);
262 
// nchoosekcombinations_: computes all N choose K combinations.
271  std::vector<std::vector<size_t> > nchoosekcombinations_(const std::vector<size_t>& n, size_t k);
272 
// addModificationsSequences_: generates modified peptide forms based on all
// possible combinations.
282  std::vector<OpenMS::AASequence> addModificationsSequences_(const std::vector<OpenMS::AASequence>& sequences,
283  const std::vector<std::vector<size_t> >& mods_combs,
284  const OpenMS::String& modification);
285 
// generateTheoreticalPeptidoforms_: generates alternative modified peptide
// forms according to ModificationsDB.
297  std::vector<OpenMS::AASequence> generateTheoreticalPeptidoforms_(const OpenMS::AASequence& sequence);
298 
// generateTheoreticalPeptidoformsDecoy_: generates alternative modified peptide
// forms according to ModificationsDB; takes both the target sequence and a
// decoy sequence.
316  std::vector<OpenMS::AASequence> generateTheoreticalPeptidoformsDecoy_(const OpenMS::AASequence& sequence, const OpenMS::AASequence& decoy_sequence);
317 
// generateTargetInSilicoMap_: generates the target in silico map.
// NOTE(review): the opening line
// (`void generateTargetInSilicoMap_(const OpenMS::TargetedExperiment& exp,` per
// the member index) is missing from the listing. The last three parameters are
// non-const references; presumably outputs. Confirm against the implementation.
332  const std::vector<String>& fragment_types,
333  const std::vector<size_t>& fragment_charges,
334  bool enable_specific_losses,
335  bool enable_unspecific_losses,
336  bool enable_ms2_precursors,
337  const std::vector<std::pair<double, double> >& swathes,
338  int round_decPow,
339  size_t max_num_alternative_localizations,
340  SequenceMapT& TargetSequenceMap,
341  IonMapT& TargetIonMap,
342  PeptideMapT& TargetPeptideMap);
343 
// generateDecoySequences_: generates decoy sequences. Reads TargetSequenceMap
// (const) and takes DecoySequenceMap by non-const reference.
353  void generateDecoySequences_(const SequenceMapT& TargetSequenceMap,
354  boost::unordered_map<String, String>& DecoySequenceMap,
355  int shuffle_seed);
356 
// generateDecoyInSilicoMap_: generates the decoy in silico map.
// NOTE(review): the opening line
// (`void generateDecoyInSilicoMap_(const OpenMS::TargetedExperiment& exp,` per
// the member index) is missing from the listing.
369  const std::vector<String>& fragment_types,
370  const std::vector<size_t>& fragment_charges,
371  bool enable_specific_losses,
372  bool enable_unspecific_losses,
373  bool enable_ms2_precursors,
374  const std::vector<std::pair<double, double> >& swathes,
375  int round_decPow,
376  TargetDecoyMapT& TargetDecoyMap,
377  PeptideMapT& TargetPeptideMap,
378  boost::unordered_map<String, String>& DecoySequenceMap,
379  IonMapT& DecoyIonMap,
380  PeptideMapT& DecoyPeptideMap);
381 
// generateTargetAssays_: generates target identification transitions.
// NOTE(review): the opening line
// (`void generateTargetAssays_(const OpenMS::TargetedExperiment& exp,` per the
// member index) is missing from the listing.
401  TransitionVectorType& transitions,
402  double mz_threshold,
403  const std::vector<std::pair<double, double> >& swathes,
404  int round_decPow,
405  const PeptideMapT& TargetPeptideMap,
406  const IonMapT& TargetIonMap);
407 
// generateDecoyAssays_: generates decoy assays.
// NOTE(review): the opening line
// (`void generateDecoyAssays_(const OpenMS::TargetedExperiment& exp,` per the
// member index) is missing from the listing.
415  TransitionVectorType& transitions,
416  double mz_threshold,
417  const std::vector<std::pair<double, double> >& swathes,
418  int round_decPow,
419  const PeptideMapT& DecoyPeptideMap,
420  TargetDecoyMapT& TargetDecoyMap,
421  const IonMapT& DecoyIonMap,
422  const IonMapT& TargetIonMap);
423 
424  };
425 }
Representation of a peptide/protein sequence.
Definition: AASequence.h:112
Generate assays from a TargetedExperiment.
Definition: MRMAssay.h:70
void generateTargetAssays_(const OpenMS::TargetedExperiment &exp, TransitionVectorType &transitions, double mz_threshold, const std::vector< std::pair< double, double > > &swathes, int round_decPow, const PeptideMapT &TargetPeptideMap, const IonMapT &TargetIonMap)
Generate target identification transitions.
std::vector< OpenMS::AASequence > generateTheoreticalPeptidoformsDecoy_(const OpenMS::AASequence &sequence, const OpenMS::AASequence &decoy_sequence)
Generate alternative modified peptide forms according to ModificationsDB.
std::vector< OpenMS::TargetedExperiment::Compound > CompoundVectorType
Definition: MRMAssay.h:83
std::vector< std::vector< size_t > > nchoosekcombinations_(const std::vector< size_t > &n, size_t k)
Computes all N choose K combinations.
void generateDecoyInSilicoMap_(const OpenMS::TargetedExperiment &exp, const std::vector< String > &fragment_types, const std::vector< size_t > &fragment_charges, bool enable_specific_losses, bool enable_unspecific_losses, bool enable_ms2_precursors, const std::vector< std::pair< double, double > > &swathes, int round_decPow, TargetDecoyMapT &TargetDecoyMap, PeptideMapT &TargetPeptideMap, boost::unordered_map< String, String > &DecoySequenceMap, IonMapT &DecoyIonMap, PeptideMapT &DecoyPeptideMap)
Generate decoy in silico map.
void detectingTransitions(OpenMS::TargetedExperiment &exp, int min_transitions, int max_transitions)
Select detecting fragment ions.
std::vector< OpenMS::AASequence > addModificationsSequences_(const std::vector< OpenMS::AASequence > &sequences, const std::vector< std::vector< size_t > > &mods_combs, const OpenMS::String &modification)
Generate modified peptide forms based on all possible combinations.
std::map< String, std::vector< const ReactionMonitoringTransition * > > CompoundTransitionMapType
Definition: MRMAssay.h:87
void restrictTransitions(OpenMS::TargetedExperiment &exp, double lower_mz_limit, double upper_mz_limit, const std::vector< std::pair< double, double > > &swathes)
Restrict and filter transitions in a TargetedExperiment.
std::map< String, std::vector< const ReactionMonitoringTransition * > > PeptideTransitionMapType
Definition: MRMAssay.h:86
int getSwath_(const std::vector< std::pair< double, double > > &swathes, const double precursor_mz)
Get swath index (precursor isolation window ordinal) for a particular precursor.
boost::unordered_map< size_t, boost::unordered_map< String, FragmentSeqMap > > IonMapT
Stores a mapping : "unmodified sequence" -> FragmentSeqMap for all SWATH windows.
Definition: MRMAssay.h:93
void generateDecoyAssays_(const OpenMS::TargetedExperiment &exp, TransitionVectorType &transitions, double mz_threshold, const std::vector< std::pair< double, double > > &swathes, int round_decPow, const PeptideMapT &DecoyPeptideMap, TargetDecoyMapT &TargetDecoyMap, const IonMapT &DecoyIonMap, const IonMapT &TargetIonMap)
Generate decoy assays.
std::vector< OpenMS::ReactionMonitoringTransition > TransitionVectorType
Definition: MRMAssay.h:84
std::vector< std::pair< double, std::string > > FragmentSeqMap
Describes a fragment sequence map of : "fragment m/z" -> "modified sequence".
Definition: MRMAssay.h:92
void generateTargetInSilicoMap_(const OpenMS::TargetedExperiment &exp, const std::vector< String > &fragment_types, const std::vector< size_t > &fragment_charges, bool enable_specific_losses, bool enable_unspecific_losses, bool enable_ms2_precursors, const std::vector< std::pair< double, double > > &swathes, int round_decPow, size_t max_num_alternative_localizations, SequenceMapT &TargetSequenceMap, IonMapT &TargetIonMap, PeptideMapT &TargetPeptideMap)
Generate target in silico map.
std::string getRandomSequence_(size_t sequence_size, boost::variate_generator< boost::mt19937 &, boost::uniform_int<> > pseudoRNG)
Generates random peptide sequence.
std::vector< OpenMS::TargetedExperiment::Peptide > PeptideVectorType
Definition: MRMAssay.h:82
std::vector< std::pair< std::string, double > > IonSeries
Describes an ion series: "ion_type" -> "fragment m/z".
Definition: MRMAssay.h:95
std::vector< OpenMS::AASequence > generateTheoreticalPeptidoforms_(const OpenMS::AASequence &sequence)
Generate alternative modified peptide forms according to ModificationsDB.
void filterMinMaxTransitionsCompound(OpenMS::TargetedExperiment &exp, int min_transitions, int max_transitions)
Filters target and decoy transitions by intensity, only keeping the top N transitions.
void generateDecoySequences_(const SequenceMapT &TargetSequenceMap, boost::unordered_map< String, String > &DecoySequenceMap, int shuffle_seed)
Generate decoy sequences.
~MRMAssay()
Destructor.
std::map< String, IonSeries > PeptideMapT
Maps a peptide sequence to an ion series: "ion_type" -> "fragment m/z".
Definition: MRMAssay.h:96
boost::unordered_map< size_t, ModifiedSequenceMap > SequenceMapT
Stores the ModifiedSequenceMap for all SWATH windows.
Definition: MRMAssay.h:90
void filterUnreferencedDecoysCompound(OpenMS::TargetedExperiment &exp)
Filters decoy transitions that do not have a respective target transition, based on the transition ID.
std::vector< OpenMS::TargetedExperiment::Protein > ProteinVectorType
Definition: MRMAssay.h:81
void uisTransitions(OpenMS::TargetedExperiment &exp, const std::vector< String > &fragment_types, const std::vector< size_t > &fragment_charges, bool enable_specific_losses, bool enable_unspecific_losses, bool enable_ms2_precursors, double mz_threshold, const std::vector< std::pair< double, double > > &swathes, int round_decPow=-4, size_t max_num_alternative_localizations=20, int shuffle_seed=-1, bool disable_decoy_transitions=false)
Annotate UIS / site-specific transitions.
void reannotateTransitions(OpenMS::TargetedExperiment &exp, double precursor_mz_threshold, double product_mz_threshold, const std::vector< String > &fragment_types, const std::vector< size_t > &fragment_charges, bool enable_specific_losses, bool enable_unspecific_losses, int round_decPow=-4)
Annotates and filters transitions in a TargetedExperiment.
std::vector< std::string > getMatchingPeptidoforms_(const double fragment_ion, const FragmentSeqMap &ions, const double mz_threshold)
Check whether a fragment ion is a unique ion signature in the vector within the threshold and return the matching peptidoforms.
bool isInSwath_(const std::vector< std::pair< double, double > > &swathes, const double precursor_mz, const double product_mz)
Check whether the product m/z of a transition falls into the precursor isolation window.
boost::unordered_map< String, TargetedExperiment::Peptide > TargetDecoyMapT
Maps the peptide id (same for target and decoy) to the decoy peptide object.
Definition: MRMAssay.h:98
boost::unordered_map< String, std::set< std::string > > ModifiedSequenceMap
Maps an unmodified sequence to all its modified sequences.
Definition: MRMAssay.h:89
Base class for all classes that want to report their progress.
Definition: ProgressLogger.h:55
A more convenient string class.
Definition: String.h:61
A description of a targeted experiment containing precursor and product ions.
Definition: TargetedExperiment.h:65
const double k
Definition: Constants.h:153
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:47