OpenMS
Loading...
Searching...
No Matches
ControlledVocabulary.h
Go to the documentation of this file.
1// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin
2// SPDX-License-Identifier: BSD-3-Clause
3//
4// --------------------------------------------------------------------------
5// $Maintainer: Timo Sachsenberg $
6// $Authors: Marc Sturm, Andreas Bertsch, Mathias Walzer $
7// --------------------------------------------------------------------------
8
9#pragma once
10
11#include <OpenMS/DATASTRUCTURES/ListUtils.h> // StringList
14
15#include <set>
16#include <map>
17
18namespace OpenMS
19{
28 class OPENMS_DLLAPI ControlledVocabulary
29 {
30 friend OPENMS_DLLAPI std::ostream& operator<<(std::ostream& os, const ControlledVocabulary& cv);
31
32public:
35 {
36 size_t operator()(const std::string& key) const noexcept
37 {
38 size_t hash = 14695981039346656037ull;
39 for (auto c : key)
40 {
41 hash ^= static_cast<unsigned char>(c);
42 hash *= 1099511628211ull;
43 }
44 return hash;
45 }
46 };
47
49 struct OPENMS_DLLAPI CVTerm
50 {
52 enum class XRefType
53 {
54 XSD_STRING = 0, // xsd:string A string
55 XSD_INTEGER, // xsd:integer Any integer
56 XSD_DECIMAL, // xsd:decimal Any real number
57 XSD_NEGATIVE_INTEGER, // xsd:negativeInteger Any negative integer
58 XSD_POSITIVE_INTEGER, // xsd:positiveInteger Any integer > 0
59 XSD_NON_NEGATIVE_INTEGER, // xsd:nonNegativeInteger Any integer >= 0
60 XSD_NON_POSITIVE_INTEGER, // xsd:nonPositiveInteger Any integer < 0
61 XSD_BOOLEAN, // xsd:boolean True or false
62 XSD_DATE, // xsd:date An XML-Schema date
63 XSD_ANYURI, // xsd:anyURI uniform resource identifier
64 NONE
65 };
66
67 static std::string getXRefTypeName(XRefType type);
68 //static bool isSearchEngineSpecificScore();
70
71 std::string name;
72 std::string id;
73 std::set<std::string> parents;
74 std::set<std::string> children;
75 bool obsolete;
76 std::string description;
81 std::set<std::string> units;
82
85
86 CVTerm(const CVTerm& rhs);
87
88 CVTerm& operator=(const CVTerm& rhs);
89
91 std::string toXMLString(const std::string& ref, const std::string& value =std::string("")) const;
92
94 std::string toXMLString(const std::string& ref, const DataValue& value) const;
95
96 };
97
100
103
105 const std::string& name() const;
106
108 const std::string& label() const;
109
111 const std::string& version() const;
112
114 const std::string& url() const;
115
125 void loadFromOBO(const std::string& name, const std::string& filename);
126
128 bool exists(const std::string& id) const;
129
131 bool hasTermWithName(const std::string& name) const;
132
138 const CVTerm& getTerm(const std::string& id) const;
139
145 const CVTerm& getTermByName(const std::string& name, const std::string& desc = "") const;
146
147
149 const std::map<std::string, CVTerm>& getTerms() const;
150
161 void getAllChildTerms(std::set<std::string>& terms, const std::string& parent_id) const;
162
171 void addAllChildTerms(std::set<std::string>& terms, const std::string& parent_id) const;
172
184 template <class LAMBDA>
185 bool iterateAllChildren(const std::string& parent_id, LAMBDA lbd) const
186 {
187 for (const auto& child_id : getTerm(parent_id).children)
188 {
189 if (lbd(child_id) || iterateAllChildren(child_id, lbd))
190 return true;
191 }
192 return false;
193 }
194
202 const ControlledVocabulary::CVTerm* checkAndGetTermByName(const std::string& name) const;
203
212 bool isChildOf(const std::string& child_id, const std::string& parent_id) const;
213
214
230
231protected:
237 bool checkName_(const std::string& id, const std::string& name, bool ignore_case = true) const;
238
240 // note: unordered_map would be faster (5% for loading mzML), but order differs across platforms
241 std::map<std::string, CVTerm> terms_;
243 std::map<std::string, std::string> namesToIds_;
245 std::string name_;
247 std::string label_;
249 std::string version_;
251 std::string url_;
252 };
253
255 OPENMS_DLLAPI std::ostream& operator<<(std::ostream& os, const ControlledVocabulary& cv);
256
257
258} // namespace OpenMS
259
Definition ControlledVocabulary.h:29
ControlledVocabulary()
Constructor.
bool exists(const std::string &id) const
Returns true if the term is in the CV. Returns false otherwise.
bool iterateAllChildren(const std::string &parent_id, LAMBDA lbd) const
Iterates over all children (incl. subchildren etc) of parent recursively, i.e. the whole subtree.
Definition ControlledVocabulary.h:185
const CVTerm & getTermByName(const std::string &name, const std::string &desc="") const
Returns a term specified by name.
std::map< std::string, CVTerm > terms_
Map from ID to CVTerm.
Definition ControlledVocabulary.h:241
std::string url_
CV URL.
Definition ControlledVocabulary.h:251
bool checkName_(const std::string &id, const std::string &name, bool ignore_case=true) const
checks if a name corresponds to an id
const std::string & name() const
Returns the CV name (set in the load method)
std::string label_
CV label.
Definition ControlledVocabulary.h:247
bool hasTermWithName(const std::string &name) const
Returns true if a term with the given name is in the CV. Returns false otherwise.
const std::string & version() const
Returns the CV version (set in the load method)
friend std::ostream & operator<<(std::ostream &os, const ControlledVocabulary &cv)
Print the contents to a stream.
std::string name_
Name set in the load method.
Definition ControlledVocabulary.h:245
const std::string & label() const
Returns the CV label (set in the load method)
void loadFromOBO(const std::string &name, const std::string &filename)
Loads the CV from an OBO file.
std::string version_
CV version.
Definition ControlledVocabulary.h:249
std::map< std::string, std::string > namesToIds_
Map from name to id.
Definition ControlledVocabulary.h:243
virtual ~ControlledVocabulary()
Destructor.
const ControlledVocabulary::CVTerm * checkAndGetTermByName(const std::string &name) const
Searches the existing terms for the given name.
void getAllChildTerms(std::set< std::string > &terms, const std::string &parent_id) const
Writes all child terms recursively into terms.
const std::map< std::string, CVTerm > & getTerms() const
returns all the terms stored in the CV
static const ControlledVocabulary & getPSIMSCV()
Returns a CV for parsing/storing PSI-MS related data, e.g. mzML, or handle accessions/ids in datastru...
bool isChildOf(const std::string &child_id, const std::string &parent_id) const
Returns if child is a child of parent.
const CVTerm & getTerm(const std::string &id) const
Returns a term specified by ID.
const std::string & url() const
Returns the CV url (set in the load method)
void addAllChildTerms(std::set< std::string > &terms, const std::string &parent_id) const
Writes the parent term and all descendant term IDs into terms.
Class to hold strings, numeric values, lists of strings and lists of numeric values.
Definition DataValue.h:32
std::vector< std::string > StringList
Vector of String.
Definition ListUtils.h:44
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19
std::ostream & operator<<(std::ostream &os, const AccurateMassSearchResult &amsr)
Representation of a CV term.
Definition ControlledVocabulary.h:50
std::string description
Term description.
Definition ControlledVocabulary.h:76
static std::string getXRefTypeName(XRefType type)
std::string toXMLString(const std::string &ref, const DataValue &value) const
get mzidentml formatted string. i.e. a cvparam xml element, ref should be the name of the ControlledV...
StringList unparsed
Unparsed lines from the definition file.
Definition ControlledVocabulary.h:78
StringList xref_binary
xref binary-data-type for the CV-term (list of all allowed data value types for the current binary da...
Definition ControlledVocabulary.h:80
bool obsolete
Flag that indicates of the term is obsolete.
Definition ControlledVocabulary.h:75
std::string name
if it is a score type, lookup has_order
Definition ControlledVocabulary.h:71
StringList synonyms
List of synonyms.
Definition ControlledVocabulary.h:77
XRefType xref_type
xref value-type for the CV-term
Definition ControlledVocabulary.h:79
std::set< std::string > parents
The parent IDs.
Definition ControlledVocabulary.h:73
XRefType
define xsd types allowed in cv term to specify their value-type
Definition ControlledVocabulary.h:53
std::set< std::string > units
unit accession ids, defined by relationship has units
Definition ControlledVocabulary.h:81
CVTerm & operator=(const CVTerm &rhs)
std::set< std::string > children
The child IDs.
Definition ControlledVocabulary.h:74
static bool isHigherBetterScore(ControlledVocabulary::CVTerm term)
std::string id
Identifier.
Definition ControlledVocabulary.h:72
std::string toXMLString(const std::string &ref, const std::string &value=std::string("")) const
get mzidentml formatted string. i.e. a cvparam xml element, ref should be the name of the ControlledV...
ensure same hash on all platforms (for reproducibility)-
Definition ControlledVocabulary.h:35
size_t operator()(const std::string &key) const noexcept
Definition ControlledVocabulary.h:36