OpenMS
Loading...
Searching...
No Matches
DTA2DFile.h
Go to the documentation of this file.
1// Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin
2// SPDX-License-Identifier: BSD-3-Clause
3//
4// --------------------------------------------------------------------------
5// $Maintainer: Timo Sachsenberg $
6// $Authors: Marc Sturm $
7// --------------------------------------------------------------------------
8
9#pragma once
10
15#include <OpenMS/SYSTEM/File.h>
16
17#include <fstream>
18#include <iostream>
19
20namespace OpenMS
21{
40 class OPENMS_DLLAPI DTA2DFile :
41 public ProgressLogger
42 {
43private:
45
46public:
47
53 ~DTA2DFile() override;
55
58
61
71 template <typename MapType>
72 void load(const std::string& filename, MapType& map)
73 {
74 startProgress(0, 0, "loading DTA2D file");
75
76 //try to open file
77 std::ifstream is(filename.c_str());
78 if (!is)
79 {
80 if (!File::exists(filename))
81 {
82 throw Exception::FileNotFound(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, filename);
83 }
84 else if (!File::readable(filename))
85 {
86 throw Exception::FileNotReadable(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, filename);
87 }
88 else
89 {
90 throw Exception::IOException(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, filename);
91 }
92 }
93
94 map.reset();
95
96 //set DocumentIdentifier
97 map.setLoadedFileType(filename);
98 map.setLoadedFilePath(filename);
99
100 // temporary variables to store the data in
101 std::vector<std::string> strings(3);
102 typename MapType::SpectrumType spec;
103 spec.setRT(-1.0); //to make sure the first RT is different from the the initialized value
105 double rt(0.0);
106 char delimiter;
107
108 // default dimension of the data
109 Size rt_dim = 0;
110 Size mz_dim = 1;
111 Size int_dim = 2;
112
113 //RT unit (default is seconds)
114 bool time_in_minutes = false;
115
116 // string to store the current line in
117 std::string line;
118
119 // native ID (numbers from 0)
120 UInt native_id = 0;
121
122 // line number counter
123 Size line_number = 0;
124
125 while (getline(is, line, '\n'))
126 {
127 ++line_number;
128 StringUtils::trim(line);
129
130 if (line.empty()) continue;
131
132 //test which delimiter is used in the line
133 if (StringUtils::has(line, '\t'))
134 {
135 delimiter = '\t';
136 }
137 else
138 {
139 delimiter = ' ';
140 }
141
142 //is header line
143 if (StringUtils::hasPrefix(line, "#"))
144 {
145 line = StringUtils::trimmed(line.substr(1));
146 StringUtils::toUpper(line);
147 StringUtils::split(line, delimiter, strings);
148
149 // flags to check if dimension is set correctly
150 bool rt_set = false;
151 bool mz_set = false;
152 bool int_set = false;
153
154 //assign new order
155 for (Size i = 0; i < 3; ++i)
156 {
157 if (strings[i] == "RT" || strings[i] == "RETENTION_TIME" || strings[i] == "MASS-TO-CHARGE" || strings[i] == "IT" || strings[i] == "INTENSITY")
158 {
159 std::cerr << "Warning: This file contains the deprecated keyword '" << strings[i] << "'." << "\n";
160 std::cerr << " Please use only the new keywords SEC/MIN, MZ, INT." << "\n";
161 }
162 if ((strings[i] == "SEC" || strings[i] == "RT" || strings[i] == "RETENTION_TIME") && rt_set == false)
163 {
164 rt_dim = i;
165 rt_set = true;
166 }
167 else if ((strings[i] == "MIN") && rt_set == false)
168 {
169 rt_dim = i;
170 rt_set = true;
171 time_in_minutes = true;
172 }
173 else if ((strings[i] == "MZ" || strings[i] == "MASS-TO-CHARGE") && mz_set == false)
174 {
175 mz_dim = i;
176 mz_set = true;
177 }
178 else if ((strings[i] == "INT" || strings[i] == "IT" || strings[i] == "INTENSITY") && int_set == false)
179 {
180 int_dim = i;
181 int_set = true;
182 }
183 else
184 {
185 throw Exception::ParseError(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, "Misformatted header line!", filename);
186 }
187 }
188 continue;
189 }
190
191 try
192 {
193 StringUtils::split(line, delimiter, strings);
194 if (strings.size() != 3)
195 {
196 throw Exception::ParseError(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, std::string("Bad data line (" + StringUtils::toStr(line_number) + "): \"") + line + "\" (got " + StringUtils::toStr(strings.size()) + ", expected 3 entries)", filename);
197 }
198 p.setIntensity(StringUtils::toFloat(strings[int_dim]));
199 p.setMZ(StringUtils::toDouble(strings[mz_dim]));
200 rt = (StringUtils::toDouble(strings[rt_dim])) * (time_in_minutes ? 60.0 : 1.0);
201 }
202 // conversion to double or something else could have gone wrong
203 catch (Exception::BaseException& /*e*/)
204 {
205 throw Exception::ParseError(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, std::string("Bad data line (" + StringUtils::toStr(line_number) + "): \"") + line + "\"", filename);
206 }
207
208 // Retention time changed -> new Spectrum
209 if (fabs(rt - spec.getRT()) > 0.0001)
210 {
211 if (spec.size() != 0
212 &&
213 (!options_.hasRTRange() || options_.getRTRange().encloses(DPosition<1>(spec.getRT())))) // RT restriction fulfilled
214 {
215 map.addSpectrum(spec);
216 }
217 setProgress(0);
218 spec.clear(true);
219 spec.setRT(rt);
220 spec.setNativeID(std::string("index=") + native_id);
221 ++native_id;
222 }
223
224 //Skip peaks with invalid m/z or intensity value
225 if (
226 (!options_.hasMZRange() || options_.getMZRange().encloses(DPosition<1>(p.getMZ())))
227 &&
229 )
230 {
231 spec.push_back(p);
232 }
233 }
234
235 // add last Spectrum
236 if (
237 spec.size() != 0
238 &&
239 (!options_.hasRTRange() || options_.getRTRange().encloses(DPosition<1>(spec.getRT()))) // RT restriction fulfilled
240 )
241 {
242 map.addSpectrum(spec);
243 }
244
245 is.close();
246 map.updateRanges();
247 endProgress();
248 }
249
258 template <typename MapType>
259 void store(const std::string& filename, const MapType& map) const
260 {
261 startProgress(0, map.size(), "storing DTA2D file");
262
263 std::ofstream os(filename.c_str());
264 if (!os)
265 {
266 throw Exception::UnableToCreateFile(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, filename);
267 }
268
269 // write header
270 os << "#SEC\tMZ\tINT\n";
271
272 // Iterate over all peaks of each spectrum and
273 // write one line for each peak of the spectrum.
274 UInt count = 0;
275 for (typename MapType::const_iterator spec = map.begin(); spec != map.end(); ++spec)
276 {
277 setProgress(count++);
278 for (typename MapType::SpectrumType::ConstIterator it = spec->begin(); it != spec->end(); ++it)
279 {
280 // Write rt, m/z and intensity.
281 os << precisionWrapper(spec->getRT()) << "\t" << precisionWrapper(it->getPos()) << "\t" << precisionWrapper(it->getIntensity()) << "\n";
282 }
283
284 }
285 os.close();
286 endProgress();
287 }
288
297 template <typename MapType>
298 void storeTIC(const std::string& filename, const MapType& map) const
299 {
300 startProgress(0, map.size(), "storing DTA2D file");
301
302 std::ofstream os(filename.c_str());
303 if (!os)
304 {
305 throw Exception::UnableToCreateFile(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, filename);
306 }
307
308 // write header (Always MZ=0 for chromatograms in DTA2D.)
309 os << "#SEC\tMZ\tINT\n";
310
312 for (typename MapType::ChromatogramType::ConstIterator it = TIC.begin(); it != TIC.end(); ++it)
313 {
314 // write rt, (mz=0) and intensity.
315 os << precisionWrapper(it->getRT()) << "\t0\t" << precisionWrapper(it->getIntensity()) << "\n";
316 }
317
318 os.close();
319 endProgress();
320 }
321
322 };
323
324} // namespace OpenMS
325
Representation of a coordinate in D-dimensional space.
Definition DPosition.h:32
bool encloses(const PositionType &position) const
Checks whether this range (half open interval!) contains a certain point.
Definition DRange.h:152
DTA2D File adapter.
Definition DTA2DFile.h:42
void load(const std::string &filename, MapType &map)
Loads a map from a DTA2D file.
Definition DTA2DFile.h:72
~DTA2DFile() override
Destructor.
DTA2DFile()
Default constructor.
const PeakFileOptions & getOptions() const
Non-mutable access to the options for loading/storing.
PeakFileOptions options_
Definition DTA2DFile.h:44
void storeTIC(const std::string &filename, const MapType &map) const
Stores the TIC of a map in a DTA2D file.
Definition DTA2DFile.h:298
PeakFileOptions & getOptions()
Mutable access to the options for loading/storing.
void store(const std::string &filename, const MapType &map) const
Stores a map in a DTA2D file.
Definition DTA2DFile.h:259
void setLoadedFileType(const std::string &file_name)
set the file_type according to the type of the file loaded from (see FileHandler::Type) preferably done whilst loading
void setLoadedFilePath(const std::string &file_name)
set the file_name_ according to absolute path of the file loaded from preferably done whilst loading
Exception base class.
Definition Exception.h:63
File not found exception.
Definition Exception.h:475
File not readable exception.
Definition Exception.h:501
General IOException.
Definition Exception.h:541
Parse Error exception.
Definition Exception.h:593
Unable to create file exception.
Definition Exception.h:606
The representation of a chromatogram.
Definition MSChromatogram.h:30
In-Memory representation of a mass spectrometry run.
Definition MSExperiment.h:49
void addSpectrum(const MSSpectrum &spectrum)
adds a spectrum to the list
Iterator begin() noexcept
Size size() const noexcept
The number of spectra.
const MSChromatogram calculateTIC(float rt_bin_size=0, UInt ms_level=1) const
Computes the total ion chromatogram (TIC) for a given MS level (use ms_level = 0 for all levels).
void reset()
Clear all internal data (spectra, chromatograms, ranges, metadata)
void updateRanges()
Updates the m/z, intensity, mobility, and retention time ranges of all spectra and chromatograms.
Base::const_iterator const_iterator
Definition MSExperiment.h:98
std::vector< SpectrumType >::const_iterator ConstIterator
Non-mutable iterator.
Definition MSExperiment.h:86
The representation of a 1D spectrum.
Definition MSSpectrum.h:44
double getRT() const
void clear(bool clear_meta_data)
Clears all data and meta data.
void setRT(double rt)
Sets the absolute retention time (in seconds)
A 1-dimensional raw data point or peak.
Definition Peak1D.h:30
CoordinateType getMZ() const
Non-mutable access to m/z.
Definition Peak1D.h:89
IntensityType getIntensity() const
Definition Peak1D.h:84
void setIntensity(IntensityType intensity)
Mutable access to the data point intensity (height)
Definition Peak1D.h:86
void setMZ(CoordinateType mz)
Mutable access to m/z.
Definition Peak1D.h:95
Options for loading files containing peak data.
Definition PeakFileOptions.h:22
bool hasRTRange() const
returns true if an RT range has been set
const DRange< 1 > & getIntensityRange() const
returns the intensity range
bool hasMZRange() const
returns true if an MZ range has been set
bool hasIntensityRange() const
returns true if an intensity range has been set
const DRange< 1 > & getMZRange() const
returns the MZ range
const DRange< 1 > & getRTRange() const
returns the RT range
Base class for all classes that want to report their progress.
Definition ProgressLogger.h:27
void setNativeID(const std::string &native_id)
sets the native identifier for the spectrum, used by the acquisition software.
Total Ion Current (TIC) as a QC metric.
Definition TIC.h:33
unsigned int UInt
Unsigned integer type.
Definition Types.h:64
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition Types.h:97
Main OpenMS namespace.
Definition openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19
const PrecisionWrapper< FloatingPointType > precisionWrapper(const FloatingPointType rhs)
Wrapper function that sets the appropriate precision for output temporarily. The original precision i...
Definition PrecisionWrapper.h:69