44 #include <boost/math/special_functions/fpclassify.hpp>
66 typedef std::map<std::pair<String, String>, std::vector<PeptideHit> >
MapAccPepType;
74 const std::vector<ProteinIdentification>& protein_identifications,
75 const std::vector<PeptideIdentification>& peptide_identifications,
76 bool first_run_inference_only,
77 bool export_empty_pep_ids =
false,
78 bool export_all_psms =
false,
79 const String& title =
"ID export from OpenMS");
85 const bool first_run_inference_only,
86 const bool export_unidentified_features,
87 const bool export_unassigned_ids,
88 const bool export_subfeatures,
89 const bool export_empty_pep_ids =
false,
90 const bool export_all_psms =
false)
const;
129 const Size n_best_search_engine_scores,
130 const std::vector<String>& optional_columns,
132 size_t& n_columns)
const;
163 output.reserve(output.size() + rows.size() + 1);
164 for (
const auto& row : rows)
166 size_t n_section_columns = 0;
167 output.push_back(generateMzTabSectionRow_(row, optional_columns, meta, n_section_columns));
168 if (n_header_columns != n_section_columns)
throw Exception::Postcondition(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION,
"Header and content differs in columns. Please report this bug to the OpenMS developers.");
180 static void sortPSM_(std::vector<PeptideIdentification>::iterator begin, std::vector<PeptideIdentification>::iterator end);
182 static void keepFirstPSM_(std::vector<PeptideIdentification>::iterator begin, std::vector<PeptideIdentification>::iterator end);
186 const std::vector<ProteinIdentification>& pro_ids,
187 std::map<
String, std::vector<PeptideIdentification> >& map_run_to_pepids,
188 std::map<
String, std::vector<ProteinIdentification> >& map_run_to_proids
229 const std::map<String, Size>& map_run_to_num_sub
A container for consensus elements.
Definition: ConsensusMap.h:88
Postcondition failed exception.
Definition: Exception.h:174
File adapter for MzTab files.
Definition: MzTabFile.h:59
static void sortPSM_(std::vector< PeptideIdentification >::iterator begin, std::vector< PeptideIdentification >::iterator end)
String generateMzTabProteinHeader_(const MzTabProteinSectionRow &reference_row, const Size n_best_search_engine_scores, const std::vector< String > &optional_columns, const MzTabMetaData &meta, size_t &n_columns) const
void storePSMUriColumn(bool store)
static void keepFirstPSM_(std::vector< PeptideIdentification >::iterator begin, std::vector< PeptideIdentification >::iterator end)
static std::pair< int, int > extractIndexPairsFromBrackets_(const String &s)
void store(const String &filename, const std::vector< ProteinIdentification > &protein_identifications, const std::vector< PeptideIdentification > &peptide_identifications, bool first_run_inference_only, bool export_empty_pep_ids=false, bool export_all_psms=false, const String &title="ID export from OpenMS")
String generateMzTabOSMHeader_(Size n_search_engine_scores, const std::vector< String > &optional_columns, size_t &n_columns) const
static String mapSearchEngineScoreToCvParam_(const String &openms_search_engine_name, double score, String score_type)
bool store_osm_uri_
Definition: MzTabFile.h:121
bool store_psm_uri_
Definition: MzTabFile.h:113
static void writePeptideHeader_(SVOutStream &output, std::map< String, Size > n_sub_samples)
bool store_smallmolecule_reliability_
Definition: MzTabFile.h:110
String generateMzTabSectionRow_(const MzTabPSMSectionRow &row, const std::vector< String > &optional_columns, const MzTabMetaData &meta, size_t &n_columns) const
bool store_protein_goterms_
Definition: MzTabFile.h:115
void storeSmallMoleculeReliabilityColumn(bool store)
bool store_protein_uri_
Definition: MzTabFile.h:111
bool store_nucleic_acid_goterms_
Definition: MzTabFile.h:122
void storePSMReliabilityColumn(bool store)
bool store_protein_reliability_
Definition: MzTabFile.h:107
static String mapSearchEngineToCvParam_(const String &openms_search_engine_name)
Map search engine identifier to CV, param etc.
bool store_psm_reliability_
Definition: MzTabFile.h:109
String generateMzTabSectionRow_(const MzTabSmallMoleculeSectionRow &row, const std::vector< String > &optional_columns, const MzTabMetaData &meta, size_t &n_columns) const
String generateMzTabSectionRow_(const MzTabProteinSectionRow &row, const std::vector< String > &optional_columns, const MzTabMetaData &meta, size_t &n_columns) const
static void writeProteinData_(SVOutStream &output, const ProteinIdentification &prot_id, Size run_count, String input_filename, bool has_coverage, const MapAccPepType &map_run_accession_to_peptides, const std::map< String, Size > &map_run_to_num_sub)
bool store_oligonucleotide_uri_
Definition: MzTabFile.h:120
String generateMzTabSectionRow_(const MzTabNucleicAcidSectionRow &row, const std::vector< String > &optional_columns, const MzTabMetaData &meta, size_t &n_columns) const
static void writeProteinHeader_(SVOutStream &output, std::map< String, Size > n_sub_samples)
static void addOptionalColumnsToSectionRow_(const std::vector< String > &column_names, const std::vector< MzTabOptionalColumnEntry > &column_entries, StringList &output)
Helper function for "generateMzTabSectionRow_" functions.
String generateMzTabNucleicAcidHeader_(Size search_ms_runs, Size n_best_search_engine_scores, Size n_search_engine_scores, const std::vector< String > &optional_columns, size_t &n_columns) const
static String extractProteinAccession_(const PeptideHit &peptide_hit)
Extracts, if possible a unique protein accession for a peptide hit in mzTab format....
static String extractPeptideModifications_(const PeptideHit &peptide_hit)
Extracts, modifications and positions of a peptide hit in mzTab format.
static String extractNumPeptidesDistinct_(String common_identifier, String protein_accession, const MapAccPepType &map_run_accession_to_peptides)
bool store_smallmolecule_uri_
Definition: MzTabFile.h:114
static void createProteinToPeptideLinks_(const std::map< String, std::vector< PeptideIdentification > > &map_run_to_pepids, MapAccPepType &map_run_accession_to_pephits)
create links from protein to peptides
bool store_oligonucleotide_reliability_
Definition: MzTabFile.h:117
String generateMzTabSmallMoleculeHeader_(Size search_ms_runs, Size n_best_search_engine_scores, Size n_search_engine_score, Size assays, Size study_variables, const std::vector< String > &optional_columns, size_t &n_columns) const
String generateMzTabOligonucleotideHeader_(Size search_ms_runs, Size n_best_search_engine_scores, Size n_search_engine_score, const std::vector< String > &optional_columns, size_t &n_columns) const
String generateMzTabPeptideHeader_(Size search_ms_runs, Size n_best_search_engine_scores, Size n_search_engine_score, Size assays, Size study_variables, const std::vector< String > &optional_columns, size_t &n_columns) const
bool store_osm_reliability_
Definition: MzTabFile.h:118
void store(const String &filename, const MzTab &mz_tab) const
std::map< std::pair< String, String >, std::vector< PeptideHit > > MapAccPepType
Definition: MzTabFile.h:66
void store(const String &filename, const ConsensusMap &cmap, const bool first_run_inference_only, const bool export_unidentified_features, const bool export_unassigned_ids, const bool export_subfeatures, const bool export_empty_pep_ids=false, const bool export_all_psms=false) const
void storeProteinReliabilityColumn(bool store)
void storeProteinGoTerms(bool store)
void generateMzTabMetaDataSection_(const MzTabMetaData &map, StringList &sl) const
String generateMzTabSectionRow_(const MzTabPeptideSectionRow &row, const std::vector< String > &optional_columns, const MzTabMetaData &meta, size_t &n_columns) const
static String extractNumPeptidesUnambiguous_(String common_identifier, String protein_accession, const MapAccPepType &map_run_accession_to_peptides)
bool store_nucleic_acid_reliability_
Definition: MzTabFile.h:116
void storeSmallMoleculeUriColumn(bool store)
void load(const String &filename, MzTab &mz_tab)
MzTabFile()
Default constructor.
bool store_peptide_uri_
Definition: MzTabFile.h:112
String generateMzTabSectionRow_(const MzTabOSMSectionRow &row, const std::vector< String > &optional_columns, const MzTabMetaData &meta, size_t &n_columns) const
static String extractNumPeptides_(const String &common_identifier, const String &protein_accession, const MapAccPepType &map_run_accession_to_peptides)
String generateMzTabPSMHeader_(Size n_search_engine_scores, const std::vector< String > &optional_columns, size_t &n_columns) const
String generateMzTabSectionRow_(const MzTabOligonucleotideSectionRow &row, const std::vector< String > &optional_columns, const MzTabMetaData &meta, size_t &n_columns) const
static std::map< String, Size > extractNumberOfSubSamples_(const std::map< String, std::vector< ProteinIdentification > > &map_run_to_proids)
void storePeptideUriColumn(bool store)
bool store_peptide_reliability_
Definition: MzTabFile.h:108
void storeProteinUriColumn(bool store)
void generateMzTabSection_(const std::vector< SectionRow > &rows, const std::vector< String > &optional_columns, const MzTabMetaData &meta, StringList &output, size_t n_header_columns) const
Generate an mzTab section comprising multiple rows of the same type and perform sanity check.
Definition: MzTabFile.h:161
void storePeptideReliabilityColumn(bool store)
static void partitionIntoRuns_(const std::vector< PeptideIdentification > &pep_ids, const std::vector< ProteinIdentification > &pro_ids, std::map< String, std::vector< PeptideIdentification > > &map_run_to_pepids, std::map< String, std::vector< ProteinIdentification > > &map_run_to_proids)
Extract protein and peptide identifications for each run. maps are assumed empty.
bool store_nucleic_acid_uri_
Definition: MzTabFile.h:119
Data model of MzTab files. Please see the official MzTab specification at https://code....
Definition: MzTab.h:809
Representation of a peptide hit.
Definition: PeptideHit.h:57
Representation of a protein identification run.
Definition: ProteinIdentification.h:72
Stream class for writing to comma/tab/...-separated values files.
Definition: SVOutStream.h:56
A more convenient string class.
Definition: String.h:61
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:127
std::vector< String > StringList
Vector of String.
Definition: ListUtils.h:70
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:47
NUC - Nucleic acid section (table-based)
Definition: MzTab.h:693
OSM - OSM (oligonucleotide-spectrum match) section (table-based)
Definition: MzTab.h:763
OLI - Oligonucleotide section (table-based)
Definition: MzTab.h:728
PEP - Peptide section (Table based)
Definition: MzTab.h:574
SML Small molecule section (table based)
Definition: MzTab.h:663
PSM - PSM section (Table based)
Definition: MzTab.h:612
PRT - Protein section (Table based)
Definition: MzTab.h:535