OpenMS  2.8.0
ModificationsDB.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2021.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Timo Sachsenberg $
32 // $Authors: Andreas Bertsch $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
41 
42 #include <set>
43 #include <memory> // unique_ptr
44 #include <unordered_map>
45 
46 namespace OpenMS
47 {
48  // forward declarations
49  class ResidueModification;
50  class Residue;
51 
76  class OPENMS_DLLAPI ModificationsDB
77  {
78 public:
79 
82 
84  static ModificationsDB* initializeModificationsDB(OpenMS::String unimod_file = "CHEMISTRY/unimod.xml", OpenMS::String psimod_file = "CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file = "CHEMISTRY/XLMOD.obo");
85 
87  static bool isInstantiated();
88 
89  friend class CrossLinksDB;
90  // for access to addNewModification_ (without checking presence)
91  friend class Residue;
92  friend class AASequence;
93 
96 
102 
111  void searchModifications(std::set<const ResidueModification*>& mods,
112  const String& mod_name,
113  const String& residue = "",
115 
126 
142  bool& multiple_matches,
143  const String& residue = "",
145 
160 
162  bool has(const String& modification) const;
163 
171  const ResidueModification* addModification(std::unique_ptr<ResidueModification> new_mod);
172 
181 
190  Size findModificationIndex(const String& mod_name) const;
191 
199  void searchModificationsByDiffMonoMass(std::vector<String>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
200  void searchModificationsByDiffMonoMass(std::vector<const ResidueModification*>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
201 
209  void searchModificationsByDiffMonoMassSorted(std::vector<String>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
210  void searchModificationsByDiffMonoMassSorted(std::vector<const ResidueModification*>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
211 
212 
233 
235  void getAllSearchModifications(std::vector<String>& modifications) const;
236 
238  void writeTSV(const String& filename);
239 
240  protected:
241 
243  static bool is_instantiated_;
244 
246  std::vector<ResidueModification*> mods_;
247 
249  std::unordered_map<String, std::set<const ResidueModification*> > modification_names_;
250 
265  bool residuesMatch_(const char residue, const ResidueModification* curr_mod) const;
266 
267 private:
268 
277  explicit ModificationsDB(OpenMS::String unimod_file = "CHEMISTRY/unimod.xml", OpenMS::String psimod_file = "CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file = "CHEMISTRY/XLMOD.obo");
278 
280  ModificationsDB(const ModificationsDB& residue_db);
281 
283  virtual ~ModificationsDB();
285 
292 
299 
305  void readFromOBOFile(const String& filename);
306 
308  void readFromUnimodXMLFile(const String& filename);
309  };
310 }
Representation of a peptide/protein sequence.
Definition: AASequence.h:112
Definition: CrossLinksDB.h:43
database which holds all residue modifications from UniMod
Definition: ModificationsDB.h:77
void searchModificationsByDiffMonoMass(std::vector< String > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Collects all modifications with delta mass inside a tolerance window.
Size getNumberOfModifications() const
Returns the number of modifications read from the unimod.xml file.
static ModificationsDB * getInstance()
Returns a pointer to the modifications DB (singleton)
bool residuesMatch_(const char residue, const ResidueModification *curr_mod) const
Helper function to check if a residue matches the origin for a modification.
const ResidueModification * getBestModificationByDiffMonoMass(double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Returns the best matching modification for the given delta mass and residue.
void writeTSV(const String &filename)
Writes tab separated entries: FullId,FullName,Origin,AA,TerminusSpecificity,DiffMonoMass (including h...
std::vector< ResidueModification * > mods_
Stores the modifications.
Definition: ModificationsDB.h:246
ModificationsDB & operator=(const ModificationsDB &aa)
Assignment operator.
void searchModificationsByDiffMonoMassSorted(std::vector< const ResidueModification * > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
const ResidueModification * addModification(const ResidueModification &new_mod)
Add a new modification to ModificationsDB. If the modification already exists (based on its fullID) i...
bool has(const String &modification) const
Returns true if the modification exists.
Size findModificationIndex(const String &mod_name) const
Returns the index of the modification in the mods_ vector; a unique name must be given.
void searchModificationsByDiffMonoMass(std::vector< const ResidueModification * > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
ModificationsDB(OpenMS::String unimod_file="CHEMISTRY/unimod.xml", OpenMS::String psimod_file="CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file="CHEMISTRY/XLMOD.obo")
void searchModificationsByDiffMonoMassSorted(std::vector< String > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Collects all modifications with delta mass inside a tolerance window and adds them sorted by mass difference.
const ResidueModification * searchModification(const ResidueModification &mod_in) const
Returns a pointer to an exact match of the given modification if present in the DB.
const ResidueModification * searchModificationsFast(const String &mod_name, bool &multiple_matches, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Returns the modification which has the given name as synonym (fast version)
static ModificationsDB * initializeModificationsDB(OpenMS::String unimod_file="CHEMISTRY/unimod.xml", OpenMS::String psimod_file="CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file="CHEMISTRY/XLMOD.obo")
Initializes the modification DB with non-default modification files (can only be done once)
void readFromUnimodXMLFile(const String &filename)
Adds modifications from a given file in Unimod XML format.
virtual ~ModificationsDB()
Destructor.
static bool isInstantiated()
Check whether ModificationsDB was instantiated before.
const ResidueModification * getModification(const String &mod_name, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Returns the modification with the given name.
const ResidueModification * getModification(Size index) const
Returns the modification with the given index. Note: the out-of-bounds check is only performed in debug mode.
static bool is_instantiated_
Stores whether ModificationsDB was instantiated before.
Definition: ModificationsDB.h:243
const ResidueModification * addNewModification_(const ResidueModification &new_mod)
Add a new modification to ModificationsDB without checking if it was inside already.
void searchModifications(std::set< const ResidueModification * > &mods, const String &mod_name, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Collects all modifications which have the given name as synonym.
ModificationsDB(const ModificationsDB &residue_db)
Copy constructor.
void readFromOBOFile(const String &filename)
Adds modifications from a given file in OBO format.
const ResidueModification * addModification(std::unique_ptr< ResidueModification > new_mod)
Add a new modification to ModificationsDB. If the modification already exists (based on its fullID) i...
void getAllSearchModifications(std::vector< String > &modifications) const
Collects all modifications that can be used for identification searches.
std::unordered_map< String, std::set< const ResidueModification * > > modification_names_
Stores the mappings of (unique) names to the modifications.
Definition: ModificationsDB.h:249
Representation of a modification.
Definition: ResidueModification.h:77
TermSpecificity
Position where the modification is allowed to occur.
Definition: ResidueModification.h:96
@ NUMBER_OF_TERM_SPECIFICITY
Definition: ResidueModification.h:102
Representation of a residue.
Definition: Residue.h:63
A more convenient string class.
Definition: String.h:60
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:47
sets the modification of AA at index by providing a pointer to a in the