OpenMS
ModificationsDB.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2023.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Timo Sachsenberg $
32 // $Authors: Andreas Bertsch $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
40 
41 #include <set>
42 #include <memory> // unique_ptr
43 #include <unordered_map>
44 
45 namespace OpenMS
46 {
47  // forward declarations
48  class ResidueModification;
49  class Residue;
50 
75  class OPENMS_DLLAPI ModificationsDB
76  {
77 public:
78 
81 
83  static ModificationsDB* initializeModificationsDB(OpenMS::String unimod_file = "CHEMISTRY/unimod.xml", OpenMS::String psimod_file = "CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file = "CHEMISTRY/XLMOD.obo");
84 
86  static bool isInstantiated();
87 
88  friend class CrossLinksDB;
89  // for access to addNewModification_ (without checking presence)
90  friend class Residue;
91  friend class AASequence;
92 
95 
101 
110  void searchModifications(std::set<const ResidueModification*>& mods,
111  const String& mod_name,
112  const String& residue = "",
114 
125 
141  bool& multiple_matches,
142  const String& residue = "",
144 
159 
161  bool has(const String& modification) const;
162 
170  const ResidueModification* addModification(std::unique_ptr<ResidueModification> new_mod);
171 
180 
189  Size findModificationIndex(const String& mod_name) const;
190 
198  void searchModificationsByDiffMonoMass(std::vector<String>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
199  void searchModificationsByDiffMonoMass(std::vector<const ResidueModification*>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
200 
208  void searchModificationsByDiffMonoMassSorted(std::vector<String>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
209  void searchModificationsByDiffMonoMassSorted(std::vector<const ResidueModification*>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
210 
211 
232 
234  void getAllSearchModifications(std::vector<String>& modifications) const;
235 
237  void writeTSV(const String& filename);
238 
239  protected:
240 
242  static bool is_instantiated_;
243 
245  std::vector<ResidueModification*> mods_;
246 
248  std::unordered_map<String, std::set<const ResidueModification*> > modification_names_;
249 
264  bool residuesMatch_(const char residue, const ResidueModification* curr_mod) const;
265 
266 private:
267 
276  explicit ModificationsDB(const OpenMS::String& unimod_file = "CHEMISTRY/unimod.xml", const OpenMS::String& psimod_file = "CHEMISTRY/PSI-MOD.obo", const OpenMS::String& xlmod_file = "CHEMISTRY/XLMOD.obo");
277 
279  ModificationsDB(const ModificationsDB& residue_db);
280 
282  virtual ~ModificationsDB();
284 
291 
298 
304  void readFromOBOFile(const String& filename);
305 
307  void readFromUnimodXMLFile(const String& filename);
308  };
309 }
Representation of a peptide/protein sequence.
Definition: AASequence.h:112
Definition: CrossLinksDB.h:43
database which holds all residue modifications from UniMod
Definition: ModificationsDB.h:76
void searchModificationsByDiffMonoMass(std::vector< String > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Collects all modifications with delta mass inside a tolerance window.
Size getNumberOfModifications() const
Returns the number of modifications read from the unimod.xml file.
static ModificationsDB * getInstance()
Returns a pointer to the modifications DB (singleton)
bool residuesMatch_(const char residue, const ResidueModification *curr_mod) const
Helper function to check if a residue matches the origin for a modification.
const ResidueModification * getBestModificationByDiffMonoMass(double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Returns the best matching modification for the given delta mass and residue.
void writeTSV(const String &filename)
Writes tab separated entries: FullId,FullName,Origin,AA,TerminusSpecificity,DiffMonoMass (including h...
std::vector< ResidueModification * > mods_
Stores the modifications.
Definition: ModificationsDB.h:245
ModificationsDB & operator=(const ModificationsDB &aa)
Assignment operator.
void searchModificationsByDiffMonoMassSorted(std::vector< const ResidueModification * > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
const ResidueModification * addModification(const ResidueModification &new_mod)
Add a new modification to ModificationsDB. If the modification already exists (based on its fullID) i...
bool has(const String &modification) const
Returns true if the modification exists.
Size findModificationIndex(const String &mod_name) const
Returns the index of the modification in the mods_ vector; a unique name must be given.
void searchModificationsByDiffMonoMass(std::vector< const ResidueModification * > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
void searchModificationsByDiffMonoMassSorted(std::vector< String > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Collects all modifications with delta mass inside a tolerance window and adds them sorted by mass dif...
const ResidueModification * searchModification(const ResidueModification &mod_in) const
Returns a pointer to an exact match of the given modification if present in the DB.
const ResidueModification * searchModificationsFast(const String &mod_name, bool &multiple_matches, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Returns the modification which has the given name as synonym (fast version)
static ModificationsDB * initializeModificationsDB(OpenMS::String unimod_file="CHEMISTRY/unimod.xml", OpenMS::String psimod_file="CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file="CHEMISTRY/XLMOD.obo")
Initializes the modification DB with non-default modification files (can only be done once)
void readFromUnimodXMLFile(const String &filename)
Adds modifications from a given file in Unimod XML format.
virtual ~ModificationsDB()
Destructor.
static bool isInstantiated()
Check whether ModificationsDB was instantiated before.
const ResidueModification * getModification(const String &mod_name, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Returns the modification with the given name.
const ResidueModification * getModification(Size index) const
Returns the modification with the given index. note: out-of-bounds check is only performed in debug m...
static bool is_instantiated_
Stores whether ModificationsDB was instantiated before.
Definition: ModificationsDB.h:242
const ResidueModification * addNewModification_(const ResidueModification &new_mod)
Add a new modification to ModificationsDB without checking if it was inside already.
ModificationsDB(const OpenMS::String &unimod_file="CHEMISTRY/unimod.xml", const OpenMS::String &psimod_file="CHEMISTRY/PSI-MOD.obo", const OpenMS::String &xlmod_file="CHEMISTRY/XLMOD.obo")
void searchModifications(std::set< const ResidueModification * > &mods, const String &mod_name, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Collects all modifications which have the given name as synonym.
ModificationsDB(const ModificationsDB &residue_db)
Copy constructor.
void readFromOBOFile(const String &filename)
Adds modifications from a given file in OBO format.
const ResidueModification * addModification(std::unique_ptr< ResidueModification > new_mod)
Add a new modification to ModificationsDB. If the modification already exists (based on its fullID) i...
void getAllSearchModifications(std::vector< String > &modifications) const
Collects all modifications that can be used for identification searches.
std::unordered_map< String, std::set< const ResidueModification * > > modification_names_
Stores the mappings of (unique) names to the modifications.
Definition: ModificationsDB.h:248
Representation of a modification on an amino acid residue.
Definition: ResidueModification.h:79
TermSpecificity
Position where the modification is allowed to occur.
Definition: ResidueModification.h:98
@ NUMBER_OF_TERM_SPECIFICITY
Definition: ResidueModification.h:104
Representation of an amino acid residue.
Definition: Residue.h:63
A more convenient string class.
Definition: String.h:60
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:48
sets the modification of AA at index by providing a pointer to a in the