OpenMS  2.7.0
ModificationsDB.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2021.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Timo Sachsenberg $
32 // $Authors: Andreas Bertsch $
33 // --------------------------------------------------------------------------
34 
35 #pragma once
36 
40 
41 #include <set>
42 #include <memory> // unique_ptr
43 #include <unordered_map>
44 
45 namespace OpenMS
46 {
47  // forward declarations
48  class ResidueModification;
49  class Residue;
50 
/// Database which holds all residue modifications from UniMod (wording taken
/// from the cross-reference index that follows this listing).
///
/// NOTE(review): this is a Doxygen source listing. The leading number on each
/// line is the original header line number, and gaps in the numbering mark
/// lines that the listing dropped: doc comments, and apparently some
/// declarations (getInstance(), getNumberOfModifications(), getModification(),
/// getBestModificationByDiffMonoMass() and operator= appear in the index but
/// not here). Confirm against the real header before relying on this text.
75  class OPENMS_DLLAPI ModificationsDB
76  {
77 public:
78 
81 
    /// Initializes the modification DB with non-default modification files
    /// (can only be done once). The three arguments are the Unimod XML,
    /// PSI-MOD OBO and XLMOD OBO file paths; each has a default.
83  static ModificationsDB* initializeModificationsDB(OpenMS::String unimod_file = "CHEMISTRY/unimod.xml", OpenMS::String psimod_file = "CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file = "CHEMISTRY/XLMOD.obo");
84 
    /// Checks whether ModificationsDB was instantiated before.
86  static bool isInstantiated();
87 
    // CrossLinksDB is granted access to the non-public members of this class.
88  friend class CrossLinksDB;
89 
92 
98 
    /// Collects all modifications which have the given name as synonym.
    /// The non-const reference parameter mods is where results are delivered
    /// (presumably appended or inserted; verify against the implementation).
    /// NOTE(review): the declaration is cut off in this listing (original line
    /// 109 is missing). The index gives the remaining parameter as
    /// ResidueModification::TermSpecificity term_spec =
    /// ResidueModification::NUMBER_OF_TERM_SPECIFICITY and marks the method const.
106  void searchModifications(std::set<const ResidueModification*>& mods,
107  const String& mod_name,
108  const String& residue = "",
110 
    /// NOTE(review): fragment of a declaration; original lines 125 and 128 are
    /// missing. The bool& multiple_matches parameter matches the index entry for
    /// searchModificationsFast, described there as: returns the modification
    /// which has the given name as synonym (fast version). Per the index the
    /// full parameter list is (const String& mod_name, bool& multiple_matches,
    /// const String& residue, ResidueModification::TermSpecificity term_spec),
    /// the return type is const ResidueModification* and the method is const.
126  bool& multiple_matches,
127  const String& residue = "",
129 
144 
    /// Returns true if the modification exists.
146  bool has(const String& modification) const;
147 
    /// Adds a new modification to ModificationsDB. The argument is passed as a
    /// std::unique_ptr by value, so the caller hands over ownership.
    /// NOTE(review): the index says the already-exists case is decided by the
    /// full ID, but its description is truncated; presumably the duplicate is
    /// not added and the returned pointer refers to the stored entry -- confirm.
155  const ResidueModification* addModification(std::unique_ptr<ResidueModification> new_mod);
156 
    /// Returns the index of the modification in the mods_ vector; a unique
    /// name must be given.
165  Size findModificationIndex(const String& mod_name) const;
166 
    /// Collects all modifications with delta mass inside a tolerance window.
    /// Two overloads: one fills a vector of String, the other a vector of
    /// const ResidueModification pointers. residue and term_spec are optional
    /// filters with defaults (empty string and NUMBER_OF_TERM_SPECIFICITY).
    /// NOTE(review): max_error presumably bounds the allowed deviation from
    /// mass; units and inclusiveness are not visible here -- confirm.
174  void searchModificationsByDiffMonoMass(std::vector<String>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
175  void searchModificationsByDiffMonoMass(std::vector<const ResidueModification*>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
176 
    /// Collects all modifications with delta mass inside a tolerance window and
    /// adds them in sorted order (the index description is truncated after
    /// "sorted by mass dif"; presumably sorted by mass difference -- confirm).
    /// Same two overloads and parameters as searchModificationsByDiffMonoMass.
184  void searchModificationsByDiffMonoMassSorted(std::vector<String>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
185  void searchModificationsByDiffMonoMassSorted(std::vector<const ResidueModification*>& mods, double mass, double max_error, const String& residue = "", ResidueModification::TermSpecificity term_spec = ResidueModification::NUMBER_OF_TERM_SPECIFICITY);
186 
187 
208 
    /// Collects all modifications that can be used for identification searches.
210  void getAllSearchModifications(std::vector<String>& modifications) const;
211 
    /// Writes tab separated entries to the given file. Columns per the index:
    /// FullId, FullName, Origin, AA, TerminusSpecificity, DiffMonoMass.
213  void writeTSV(const String& filename);
214 
215  protected:
216 
    /// Stores whether ModificationsDB was instantiated before.
218  static bool is_instantiated_;
219 
    /// Stores the modifications (raw pointers; who deletes them is not visible
    /// in this header listing).
221  std::vector<ResidueModification*> mods_;
222 
    /// Stores the mappings of (unique) names to the modifications.
224  std::unordered_map<String, std::set<const ResidueModification*> > modification_names_;
225 
    /// Helper function to check if a residue matches the origin for a modification.
240  bool residuesMatch_(const char residue, const ResidueModification* curr_mod) const;
241 
242 private:
243 
    /// Private constructor taking the Unimod XML, PSI-MOD OBO and XLMOD OBO
    /// file paths (same defaults as initializeModificationsDB). The index
    /// describes the class as a singleton reached through getInstance().
252  explicit ModificationsDB(OpenMS::String unimod_file = "CHEMISTRY/unimod.xml", OpenMS::String psimod_file = "CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file = "CHEMISTRY/XLMOD.obo");
253 
    /// Copy constructor; private, so code outside the class cannot copy the DB.
255  ModificationsDB(const ModificationsDB& residue_db);
256 
    /// Destructor.
258  virtual ~ModificationsDB();
260 
267 
    /// Adds modifications from a given file in OBO format.
273  void readFromOBOFile(const String& filename);
274 
    /// Adds modifications from a given file in Unimod XML format.
276  void readFromUnimodXMLFile(const String& filename);
277  };
278 }
Definition: CrossLinksDB.h:43
database which holds all residue modifications from UniMod
Definition: ModificationsDB.h:76
void searchModificationsByDiffMonoMass(std::vector< String > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Collects all modifications with delta mass inside a tolerance window.
Size getNumberOfModifications() const
Returns the number of modifications read from the unimod.xml file.
static ModificationsDB * getInstance()
Returns a pointer to the modifications DB (singleton)
bool residuesMatch_(const char residue, const ResidueModification *curr_mod) const
Helper function to check if a residue matches the origin for a modification.
const ResidueModification * getBestModificationByDiffMonoMass(double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Returns the best matching modification for the given delta mass and residue.
void writeTSV(const String &filename)
Writes tab separated entries: FullId,FullName,Origin,AA,TerminusSpecificity,DiffMonoMass (including header)
std::vector< ResidueModification * > mods_
Stores the modifications.
Definition: ModificationsDB.h:221
ModificationsDB & operator=(const ModificationsDB &aa)
Assignment operator.
void searchModificationsByDiffMonoMassSorted(std::vector< const ResidueModification * > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
bool has(const String &modification) const
Returns true if the modification exists.
Size findModificationIndex(const String &mod_name) const
Returns the index of the modification in the mods_ vector; a unique name must be given.
void searchModificationsByDiffMonoMass(std::vector< const ResidueModification * > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
ModificationsDB(OpenMS::String unimod_file="CHEMISTRY/unimod.xml", OpenMS::String psimod_file="CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file="CHEMISTRY/XLMOD.obo")
void searchModificationsByDiffMonoMassSorted(std::vector< String > &mods, double mass, double max_error, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY)
Collects all modifications with delta mass inside a tolerance window and adds them sorted by mass difference.
const ResidueModification * searchModificationsFast(const String &mod_name, bool &multiple_matches, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Returns the modification which has the given name as synonym (fast version)
static ModificationsDB * initializeModificationsDB(OpenMS::String unimod_file="CHEMISTRY/unimod.xml", OpenMS::String psimod_file="CHEMISTRY/PSI-MOD.obo", OpenMS::String xlmod_file="CHEMISTRY/XLMOD.obo")
Initializes the modification DB with non-default modification files (can only be done once)
void readFromUnimodXMLFile(const String &filename)
Adds modifications from a given file in Unimod XML format.
virtual ~ModificationsDB()
Destructor.
static bool isInstantiated()
Check whether ModificationsDB was instantiated before.
const ResidueModification * getModification(const String &mod_name, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Returns the modification with the given name.
const ResidueModification * getModification(Size index) const
Returns the modification with the given index. note: out-of-bounds check is only performed in debug mode.
static bool is_instantiated_
Stores whether ModificationsDB was instantiated before.
Definition: ModificationsDB.h:218
void searchModifications(std::set< const ResidueModification * > &mods, const String &mod_name, const String &residue="", ResidueModification::TermSpecificity term_spec=ResidueModification::NUMBER_OF_TERM_SPECIFICITY) const
Collects all modifications which have the given name as synonym.
ModificationsDB(const ModificationsDB &residue_db)
Copy constructor.
void readFromOBOFile(const String &filename)
Adds modifications from a given file in OBO format.
const ResidueModification * addModification(std::unique_ptr< ResidueModification > new_mod)
Add a new modification to ModificationsDB. If the modification already exists (based on its fullID) it is not added.
void getAllSearchModifications(std::vector< String > &modifications) const
Collects all modifications that can be used for identification searches.
std::unordered_map< String, std::set< const ResidueModification * > > modification_names_
Stores the mappings of (unique) names to the modifications.
Definition: ModificationsDB.h:224
Representation of a modification.
Definition: ResidueModification.h:77
TermSpecificity
Position where the modification is allowed to occur.
Definition: ResidueModification.h:96
@ NUMBER_OF_TERM_SPECIFICITY
Definition: ResidueModification.h:102
A more convenient string class.
Definition: String.h:61
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:47