OpenMS
QTCluster.h
Go to the documentation of this file.
1 // Copyright (c) 2002-2023, The OpenMS Team -- EKU Tuebingen, ETH Zurich, and FU Berlin
2 // SPDX-License-Identifier: BSD-3-Clause
3 //
4 // --------------------------------------------------------------------------
5 // $Maintainer: Hendrik Weisser $
6 // $Authors: Steffen Sass, Hendrik Weisser $
7 // --------------------------------------------------------------------------
8 
9 
10 #pragma once
11 
12 #include <OpenMS/CONCEPT/Types.h>
14 #include <OpenMS/OpenMSConfig.h>
15 #include <OpenMS/config.h>
16 
17 #include <unordered_map>
18 
19 #include <map> // for multimap<>
20 #include <vector> // for vector<>
21 #include <set> // for set<>
22 #include <utility> // for pair<>
23 
24 namespace OpenMS
25 {
26  class GridFeature;
27 
    /// A representation of a QT cluster used for feature grouping.
    ///
    /// The object itself holds only a few flags plus the cached quality; the
    /// cross-reference text of this listing describes the remaining state
    /// (neighbors, annotations, etc.) as living in a separate BulkData object.
    ///
    /// NOTE(review): this listing is an extract. Several declaration lines are
    /// absent from it (see the individual notes below); they are not restored here.
81  class OPENMS_DLLAPI QTCluster
82  {
83 public:
84 
85  // need to store more than one
    /// Neighbor candidates as (distance, feature) pairs; a multimap, so several
    /// features may share the same distance key.
86  typedef std::multimap<double, const GridFeature*> NeighborList;
    /// Maps a Size key to its NeighborList.
    /// NOTE(review): the key is presumably the input map index - confirm.
87  typedef std::unordered_map<Size, NeighborList> NeighborMapMulti;
88 
    /// A single neighbor entry.
    /// NOTE(review): listing line 92 is missing here; the cross-reference names a
    /// `const GridFeature* feature` member defined on that line.
89  struct Neighbor
90  {
91  double distance;
93  };
94 
    /// Maps a Size key to one Neighbor.
95  typedef std::unordered_map<Size, Neighbor> NeighborMap;
96 
    /// One clustered element.
    /// NOTE(review): listing lines 99-100 are missing; the cross-reference names a
    /// `Size map_index` member on line 99. The content of line 100 is not visible.
97  struct Element
98  {
101  };
102 
    /// Sequence of elements, e.g. as passed to update().
103  typedef std::vector<Element> Elements;
104 
    /// Class to store the bulk internal data (neighbors, annotations, etc.).
    /// QTCluster is declared a friend so it can reach the private members.
111  class OPENMS_DLLAPI BulkData
112  {
113  friend class QTCluster;
114 
115  public:
116 
    /// Detailed constructor of the cluster body.
124  BulkData(const OpenMS::GridFeature* const center_point,
125  Size num_maps, double max_distance,
126  Int x_coord, Int y_coord, Size id);
127 
128  private:
129 
    // NOTE(review): the member declarations for listing lines 131-161 are missing
    // from this extract. Per the cross-reference they are: center_point_ (131),
    // id_ (134), neighbors_ (140), tmp_neighbors_ (149), max_distance_ (152),
    // num_maps_ (155), x_coord_ (158) and y_coord_ (161).
132 
135 
141 
150 
153 
156 
159 
162 
    /// Set of annotations of the cluster.
169  std::set<AASequence> annotations_;
170  };
171 
    /// Detailed constructor of the cluster head.
178  QTCluster(BulkData* const data, bool use_IDs);
179 
    /// Default constructor is deleted: a cluster cannot be created without a BulkData*.
185  QTCluster() = delete;
186 
    /// Cheap copy ctor because most of the data lies outside of this class (BulkData*).
193  QTCluster(const QTCluster& rhs) = default;
194 
    /// Cheap copy assignment, see copy ctor for details.
196  QTCluster& operator=(const QTCluster& rhs) = default;
197 
    /// Cheap move ctor because most of the data lies outside of this class (BulkData*).
199  QTCluster(QTCluster&& rhs) = default;
200 
    /// Cheap move assignment because most of the data lies outside of this class (BulkData*).
202  QTCluster& operator=(QTCluster&& rhs) = default;
203 
204  ~QTCluster() = default;
205 
    /// Returns the cluster center.
207  const GridFeature* getCenterPoint() const;
208 
    /// Returns the cluster's id.
210  Size getId() const;
211 
    /// Returns the RT value of the cluster.
213  double getCenterRT() const;
214 
    /// Returns the m/z value of the cluster center.
216  double getCenterMZ() const;
217 
    /// Returns the x coordinate in the grid.
219  Int getXCoord() const;
220 
    /// Returns the y coordinate in the grid.
222  Int getYCoord() const;
223 
    /// Returns the size of the cluster (number of elements, incl. center).
225  Size size() const;
226 
    /// Compare by quality.
228  bool operator<(const QTCluster& cluster) const;
229 
    /// Adds a new element/neighbor to the cluster.
    /// Per the cross-reference, initializeCluster() has to be called before and
    /// finalizeCluster() after adding elements.
236  void add(const GridFeature* const element, double distance);
237 
    // NOTE(review): the cross-reference also lists initializeCluster() and
    // finalizeCluster(); their declarations are not visible in this extract
    // (presumably the missing listing lines around 238-239 and 275-281).
240 
    /// Updates the cluster after the indicated data points are removed.
248  bool update(const Elements& removed);
249 
    /// Returns the cluster quality and recomputes if necessary (hence non-const).
251  double getQuality();
252 
    /// Returns the cluster quality without recomputing.
254  double getCurrentQuality() const;
255 
    /// Return the set of peptide sequences annotated to the cluster center.
257  const std::set<AASequence>& getAnnotations();
258 
    /// Sets current cluster as invalid (also frees some memory).
266  void setInvalid();
267 
    /// Whether current cluster is invalid, i.e. the negation of valid_.
269  inline bool isInvalid() const
270  {
271  return !valid_;
272  }
273 
    // NOTE(review): the cross-reference lists getElements() and getAllNeighbors();
    // their declarations are not visible in this extract.
276 
279 
282 
283  private:
    // NOTE(review): the cross-reference lists computeQuality_(), optimizeAnnotations_()
    // and recomputeNeighbors_(); their declarations are not visible in this extract.
286 
307 
    /// Compute seq table, mapping: peptides -> best distance per input map.
    /// The result is written into the seq_table out-parameter.
309  void makeSeqTable_(std::map<AASequence, std::map<Size,double>>& seq_table) const;
310 
313 
    /// Quality of the cluster.
315  double quality_;
316 
    // NOTE(review): listing line 318 is missing; the cross-reference names a
    // `BulkData* data_` member (pointer to data members) on that line.
319 
    /// Whether current cluster is valid.
321  bool valid_;
322 
    /// Has the cluster changed (if yes, quality needs to be recomputed)?
324  bool changed_;
325 
    /// Keep track of peptide IDs and use them for matching?
327  bool use_IDs_;
328 
    // NOTE(review): the cross-reference names two further flags that are missing here:
    // collect_annotations_ (line 338) and finalized_ (line 341).
339 
342  };
343 
344 } // namespace OpenMS
Representation of a peptide/protein sequence.
Definition: AASequence.h:86
Representation of a feature in a hash grid.
Definition: GridFeature.h:27
Class to store the bulk internal data (neighbors, annotations, etc.)
Definition: QTCluster.h:112
NeighborMapMulti tmp_neighbors_
Temporary map tracking *all* neighbors.
Definition: QTCluster.h:149
BulkData(const OpenMS::GridFeature *const center_point, Size num_maps, double max_distance, Int x_coord, Int y_coord, Size id)
Detailed constructor of the cluster body.
Int x_coord_
x coordinate in the grid cell
Definition: QTCluster.h:158
const GridFeature *const center_point_
Pointer to the cluster center.
Definition: QTCluster.h:131
std::set< AASequence > annotations_
Set of annotations of the cluster.
Definition: QTCluster.h:169
NeighborMap neighbors_
Map that keeps track of the best current feature for each map.
Definition: QTCluster.h:140
Size num_maps_
Number of input maps.
Definition: QTCluster.h:155
Int y_coord_
y coordinate in the grid cell
Definition: QTCluster.h:161
double max_distance_
Maximum distance of a point that can still belong to the cluster.
Definition: QTCluster.h:152
Size id_
unique id of this cluster
Definition: QTCluster.h:134
A representation of a QT cluster used for feature grouping.
Definition: QTCluster.h:82
std::vector< Element > Elements
Definition: QTCluster.h:103
const std::set< AASequence > & getAnnotations()
Return the set of peptide sequences annotated to the cluster center.
void setInvalid()
Sets current cluster as invalid (also frees some memory)
Int getXCoord() const
Returns the x coordinate in the grid.
void initializeCluster()
Has to be called before adding elements (calling QTCluster::add)
double getCurrentQuality() const
Returns the cluster quality without recomputing.
QTCluster(const QTCluster &rhs)=default
Cheap copy ctor because most of the data lies outside of this class (BulkData*). Be very careful with ...
bool isInvalid() const
Whether current cluster is invalid.
Definition: QTCluster.h:269
bool valid_
Whether current cluster is valid.
Definition: QTCluster.h:321
void add(const GridFeature *const element, double distance)
Adds a new element/neighbor to the cluster.
double quality_
Quality of the cluster.
Definition: QTCluster.h:315
bool collect_annotations_
Whether initial collection of all neighbors is needed.
Definition: QTCluster.h:338
QTCluster & operator=(const QTCluster &rhs)=default
Cheap copy assignment, see copy ctor for details.
bool operator<(const QTCluster &cluster) const
Compare by quality.
void recomputeNeighbors_()
Reports elements that are compatible with the optimal annotation.
const GridFeature * getCenterPoint() const
Returns the cluster center.
void makeSeqTable_(std::map< AASequence, std::map< Size, double >> &seq_table) const
Computes the sequence table, mapping peptides -> best distance per input map.
std::multimap< double, const GridFeature * > NeighborList
Definition: QTCluster.h:86
Size map_index
Definition: QTCluster.h:99
Size getId() const
Returns the cluster's id.
void finalizeCluster()
Has to be called after adding elements (after calling QTCluster::add one or multiple times)
double distance
Definition: QTCluster.h:91
BulkData * data_
Pointer to data members.
Definition: QTCluster.h:318
double optimizeAnnotations_()
Finds the optimal annotation (peptide sequences) for the cluster.
~QTCluster()=default
Elements getAllNeighbors() const
Get all current neighbors.
bool changed_
Has the cluster changed (if yes, quality needs to be recomputed)?
Definition: QTCluster.h:324
bool use_IDs_
Keep track of peptide IDs and use them for matching?
Definition: QTCluster.h:327
std::unordered_map< Size, NeighborList > NeighborMapMulti
Definition: QTCluster.h:87
bool update(const Elements &removed)
Updates the cluster after the indicated data points are removed.
Size size() const
Returns the size of the cluster (number of elements, incl. center)
QTCluster(BulkData *const data, bool use_IDs)
Detailed constructor of the cluster head.
double getQuality()
Returns the cluster quality and recomputes if necessary.
double getCenterMZ() const
Returns the m/z value of the cluster center.
QTCluster(QTCluster &&rhs)=default
Cheap move ctor because most of the data lies outside of this class (BulkData*).
QTCluster & operator=(QTCluster &&rhs)=default
Cheap move assignment because most of the data lies outside of this class (BulkData*).
Int getYCoord() const
Returns the y coordinate in the grid.
double getCenterRT() const
Returns the RT value of the cluster center.
bool finalized_
Whether current cluster is accepting new elements or not (if true, no more new elements allowed)
Definition: QTCluster.h:341
const GridFeature * feature
Definition: QTCluster.h:92
void computeQuality_()
Computes the quality of the cluster.
QTCluster()=delete
Default constructor is not accessible. Objects of this class should only exist with a valid BulkData* giv...
Elements getElements() const
Gets the clustered elements meaning neighbors + cluster center.
std::unordered_map< Size, Neighbor > NeighborMap
Definition: QTCluster.h:95
Definition: QTCluster.h:98
Definition: QTCluster.h:90
int Int
Signed integer type.
Definition: Types.h:76
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:101
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:22