OpenMS
ModifiedPeptideGenerator.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2023.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Timo Sachsenberg $
32 // $Authors: Timo Sachsenberg $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
39 
42 #include <vector>
43 #include <map>
44 #include <unordered_map>
45 #include <set>
46 
47 namespace OpenMS
48 {
49  class OPENMS_DLLAPI ModifiedPeptideGenerator
50  {
51  /*
52  * @brief Modifications can be generated and applied to AASequences.
53  */
54 
55  public:
56  // struct needed to wrap the template for pyOpenMS
57  struct MapToResidueType { std::unordered_map<const ResidueModification*, const Residue*> val; };
58 
69  static MapToResidueType getModifications(const StringList& modNames);
70 
71  // Applies fixed modifications to a single peptide
73  const MapToResidueType& fixed_mods,
74  AASequence& peptide);
75 
76  // Applies variable modifications to a single peptide. If keep_original is set the original (e.g. unmodified version) is also returned
78  const MapToResidueType& var_mods,
79  const AASequence& peptide,
80  Size max_variable_mods_per_peptide,
81  std::vector<AASequence>& all_modified_peptides,
82  bool keep_original=true);
83 
84  protected:
85  static const int N_TERM_MODIFICATION_INDEX; // magic constant to distinguish N_TERM only modifications from ANYWHERE modifications placed at N-term residue
86  static const int C_TERM_MODIFICATION_INDEX; // magic constant to distinguish C_TERM only modifications from ANYWHERE modifications placed at C-term residue
87 
88  // Lookup datastructure to allow lock-free generation of modified peptides
89  static MapToResidueType createResidueModificationToResidueMap_(const std::vector<const ResidueModification*>& mods);
90 
91  // Fast implementation of modification placement. No combinatoric placement is needed in this case - just every site is modified once by each compatible modification. Already modified residues are skipped
93  const MapToResidueType& var_mods,
94  const AASequence& peptide,
95  std::vector<AASequence>& all_modified_peptides,
96  bool keep_original=true);
97 
98  private:
100  static void applyAllModsAtIdxAndExtend_(std::vector<AASequence>& original_sequences, int idx_to_modify, const std::vector<const ResidueModification*>& mods, const MapToResidueType& var_mods);
102  static void applyModToPep_(AASequence& current_peptide, int current_index, const ResidueModification* m, const MapToResidueType& var_mods);
103  };
104 }
Representation of a peptide/protein sequence.
Definition: AASequence.h:112
Definition: ModifiedPeptideGenerator.h:50
static void applyVariableModifications(const MapToResidueType &var_mods, const AASequence &peptide, Size max_variable_mods_per_peptide, std::vector< AASequence > &all_modified_peptides, bool keep_original=true)
std::unordered_map< const ResidueModification *, const Residue * > val
Definition: ModifiedPeptideGenerator.h:57
static const int N_TERM_MODIFICATION_INDEX
Definition: ModifiedPeptideGenerator.h:85
static MapToResidueType getModifications(const StringList &modNames)
Retrieve modifications from strings.
static void applyModToPep_(AASequence &current_peptide, int current_index, const ResidueModification *m, const MapToResidueType &var_mods)
applies a modification m to the current_peptide at current_index. Overwrites mod if it exists....
static void applyAtMostOneVariableModification_(const MapToResidueType &var_mods, const AASequence &peptide, std::vector< AASequence > &all_modified_peptides, bool keep_original=true)
static const int C_TERM_MODIFICATION_INDEX
Definition: ModifiedPeptideGenerator.h:86
static void applyAllModsAtIdxAndExtend_(std::vector< AASequence > &original_sequences, int idx_to_modify, const std::vector< const ResidueModification * > &mods, const MapToResidueType &var_mods)
take a vector of AASequences original_sequences, and for each mod in mods, add a version with mod at ...
static void applyFixedModifications(const MapToResidueType &fixed_mods, AASequence &peptide)
static MapToResidueType createResidueModificationToResidueMap_(const std::vector< const ResidueModification * > &mods)
Definition: ModifiedPeptideGenerator.h:57
Representation of a modification on an amino acid residue.
Definition: ResidueModification.h:79
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
std::vector< String > StringList
Vector of String.
Definition: ListUtils.h:70
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:48