OpenMS
PrecursorIonSelectionPreprocessing.h
Go to the documentation of this file.
1 // --------------------------------------------------------------------------
2 // OpenMS -- Open-Source Mass Spectrometry
3 // --------------------------------------------------------------------------
4 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,
5 // ETH Zurich, and Freie Universitaet Berlin 2002-2023.
6 //
7 // This software is released under a three-clause BSD license:
8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above copyright
11 // notice, this list of conditions and the following disclaimer in the
12 // documentation and/or other materials provided with the distribution.
13 // * Neither the name of any author or any participating institution
14 // may be used to endorse or promote products derived from this software
15 // without specific prior written permission.
16 // For a full list of authors, refer to the file AUTHORS.
17 // --------------------------------------------------------------------------
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING
22 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
23 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
24 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
25 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
26 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
27 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
28 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 //
30 // --------------------------------------------------------------------------
31 // $Maintainer: Timo Sachsenberg $
32 // $Authors: $
33 // --------------------------------------------------------------------------
34 //
35 
36 #pragma once
37 
42 
43 #include <set>
44 namespace OpenMS
45 {
46 
/// @brief Implements the database preprocessing needed for precursor ion selection.
///
/// Derives from DefaultParamHandler and overrides updateMembers_().
/// NOTE(review): this listing appears incomplete. The cross-reference index that
/// follows the listing names members that have no declaration here (copy
/// constructor, operator=, loadPreprocessing(), filterTaxonomyIdentifier_(),
/// f_max_, fixed_mods_) -- consult the real header before editing.
52  class OPENMS_DLLAPI PrecursorIonSelectionPreprocessing :
53  public DefaultParamHandler
54  {
55 public:
59 
61 
    /// Read-only access to a map from String to a vector of doubles.
    /// Presumably returns prot_masses_ (defined outside this header -- confirm).
62  const std::map<String, std::vector<double> > & getProtMasses() const;
63 
    /// Read-only access to a vector of masses selected by @p acc.
    /// Presumably @p acc is a protein accession used as key into prot_masses_ -- confirm.
64  const std::vector<double> & getMasses(const String& acc) const;
65 
    /// Read-only accessors for the per-protein maps.
    /// Presumably they return rt_prot_map_, pt_prot_map_ and prot_peptide_seq_map_
    /// respectively (defined outside this header -- confirm).
66  const std::map<String, std::vector<double> > & getProteinRTMap() const;
67  const std::map<String, std::vector<double> > & getProteinPTMap() const;
68  const std::map<String, std::vector<String> > & getProteinPeptideSequenceMap() const;
69 
70 
    /// @brief Calculates tryptic peptide masses of a given database and stores masses and peptide sequences.
    /// @param db_path Path to the database.
    /// @param save Defaults to true; presumably controls whether the preprocessed
    ///        database is written to disk -- confirm in the implementation.
80  void dbPreprocessing(const String& db_path, bool save = true);
81 
    /// @brief Calculates tryptic peptide masses of a given database and stores masses and peptide sequences.
    /// @param db_path Path to the database.
    /// @param rt_model_path Path to a model file (presumably the retention time model -- confirm).
    /// @param dt_model_path Path to a model file (presumably the detectability model -- confirm).
    /// @param save Defaults to true; presumably controls whether the preprocessed
    ///        database is written to disk -- confirm in the implementation.
93  void dbPreprocessing(const String& db_path, const String& rt_model_path, const String& dt_model_path, bool save = true);
94 
95 
104 
    /// @brief Get the weighted frequency of a mass.
106  double getWeight(double mass);
107 
    /// Looks up a value for peptide @p peptide_index of protein @p prot_id.
    /// Presumably the retention time taken from rt_prot_map_ -- confirm.
108  double getRT(const String& prot_id, Size peptide_index);
109 
    /// Looks up a value for peptide @p peptide_index of protein @p prot_id.
    /// Presumably taken from pt_prot_map_ -- confirm what "PT" denotes.
110  double getPT(const String& prot_id, Size peptide_index);
111 
    /// Sets the fixed modifications from a list of strings.
    /// Takes a non-const reference; whether @p modifications is modified cannot be
    /// determined from this header.
112  void setFixedModifications(StringList & modifications);
    /// Returns a const reference to fixed_modifications_.
    /// NOTE(review): unlike the other accessors in this class, this one is not
    /// declared const, so it cannot be called on a const object.
113  const std::map<char, std::vector<String> > & getFixedModifications()
114  {
115  return fixed_modifications_;
116  }
117 
    /// Sets Gaussian parameters; presumably stores them in mu_ and sigma_ -- confirm.
118  void setGaussianParameters(double mu, double sigma);
    /// Returns mu_.
119  double getGaussMu() const
120  {
121  return mu_;
122  }
123 
    /// Returns sigma_.
124  double getGaussSigma() const
125  {
126  return sigma_;
127  }
128 
    /// Two overloads: one identifies the peptide by protein id and peptide index,
    /// the other takes a predicted retention time directly. Both take @p feature by
    /// non-const reference. Exact probability semantics are defined outside this header.
129  double getRTProbability(const String& prot_id, Size peptide_index, Feature & feature);
130  double getRTProbability(double pred_rt, Feature & feature);
131 
132 protected:
    /// Saves the preprocessed db.
134  void savePreprocessedDB_(const String& db_path, const String& path);
    /// Presumably the variant of savePreprocessedDB_() that also stores RT data -- confirm.
135  void savePreprocessedDBWithRT_(const String& db_path, const String& path);
    /// Loads the preprocessed db.
137  void loadPreprocessedDB_(const String& path);
    /// Maps a retention time to an integer scan number (mapping defined outside this header).
140  Int getScanNumber_(double rt);
    /// Helper taking an observed RT range [min_obs_rt, max_obs_rt] and a predicted RT;
    /// presumably used by the public getRTProbability() overloads -- confirm.
141  double getRTProbability_(double min_obs_rt, double max_obs_rt, double pred_rt);
    /// Overrides DefaultParamHandler::updateMembers_() to update the members.
143  void updateMembers_() override;
144 
    /// All tryptic masses of the distinct peptides in the database.
146  std::vector<double> masses_;
    /// The sequences of the tryptic peptides.
148  std::set<AASequence> sequences_;
    /// Stores masses of tryptic peptides for proteins, key is the accession number.
150  std::map<String, std::vector<double> > prot_masses_;
    /// The masses of the bins used for preprocessing (only used if bins are not equidistant).
152  std::vector<double> bin_masses_;
    /// Counter for the bins.
154  std::vector<UInt> counter_;
157 
    /// Per-protein vectors keyed by String; returned by no inline accessor in this
    /// listing. Presumably keyed by protein accession like prot_masses_ -- confirm.
159  std::map<String, std::vector<double> > rt_prot_map_;
160  std::map<String, std::vector<double> > pt_prot_map_;
161  std::map<String, std::vector<String> > prot_peptide_seq_map_;
    /// Fixed modifications, keyed by a single char (presumably the amino-acid
    /// one-letter code -- confirm); exposed via getFixedModifications().
162  std::map<char, std::vector<String> > fixed_modifications_;
    /// Returned by getGaussSigma().
163  double sigma_;
    /// Returned by getGaussMu().
164  double mu_;
165 
166 
167  };
168 }
169 
A base class for all classes handling default parameters.
Definition: DefaultParamHandler.h:92
An LC-MS feature.
Definition: Feature.h:72
This class implements the database preprocessing needed for precursor ion selection.
Definition: PrecursorIonSelectionPreprocessing.h:54
double getRT(const String &prot_id, Size peptide_index)
double getRTProbability(const String &prot_id, Size peptide_index, Feature &feature)
std::map< String, std::vector< String > > prot_peptide_seq_map_
Definition: PrecursorIonSelectionPreprocessing.h:161
const std::map< char, std::vector< String > > & getFixedModifications()
Definition: PrecursorIonSelectionPreprocessing.h:113
std::map< char, std::vector< String > > fixed_modifications_
Definition: PrecursorIonSelectionPreprocessing.h:162
double getGaussSigma() const
Definition: PrecursorIonSelectionPreprocessing.h:124
double sigma_
Definition: PrecursorIonSelectionPreprocessing.h:163
std::vector< UInt > counter_
counter for the bins
Definition: PrecursorIonSelectionPreprocessing.h:154
void savePreprocessedDB_(const String &db_path, const String &path)
saves the preprocessed db
UInt f_max_
maximal relative frequency of a mass
Definition: PrecursorIonSelectionPreprocessing.h:156
double mu_
Definition: PrecursorIonSelectionPreprocessing.h:164
bool fixed_mods_
Definition: PrecursorIonSelectionPreprocessing.h:158
const std::vector< double > & getMasses(const String &acc) const
std::vector< double > masses_
all tryptic masses of the distinct peptides in the database
Definition: PrecursorIonSelectionPreprocessing.h:146
void dbPreprocessing(const String &db_path, const String &rt_model_path, const String &dt_model_path, bool save=true)
Calculates tryptic peptide masses of a given database and stores masses and peptide sequences.
double getRTProbability_(double min_obs_rt, double max_obs_rt, double pred_rt)
double getPT(const String &prot_id, Size peptide_index)
const std::map< String, std::vector< double > > & getProteinPTMap() const
double getWeight(double mass)
get the weighted frequency of a mass
void filterTaxonomyIdentifier_(FASTAFile::FASTAEntry &entry)
pre-process fasta identifier
double getGaussMu() const
Definition: PrecursorIonSelectionPreprocessing.h:119
double getRTProbability(double pred_rt, Feature &feature)
void loadPreprocessing()
Loads tryptic peptide masses of a given database.
void dbPreprocessing(const String &db_path, bool save=true)
Calculates tryptic peptide masses of a given database and stores masses and peptide sequences.
void setGaussianParameters(double mu, double sigma)
PrecursorIonSelectionPreprocessing(const PrecursorIonSelectionPreprocessing &source)
void updateMembers_() override
Overrides the updateMembers_() method of DefaultParamHandler to update the members.
PrecursorIonSelectionPreprocessing & operator=(const PrecursorIonSelectionPreprocessing &source)
void setFixedModifications(StringList &modifications)
std::map< String, std::vector< double > > pt_prot_map_
Definition: PrecursorIonSelectionPreprocessing.h:160
std::vector< double > bin_masses_
the masses of the bins used for preprocessing (only used if bins are not equidistant,...
Definition: PrecursorIonSelectionPreprocessing.h:152
std::map< String, std::vector< double > > prot_masses_
stores masses of tryptic peptides for proteins, key is the accession number
Definition: PrecursorIonSelectionPreprocessing.h:150
std::set< AASequence > sequences_
the sequences of the tryptic peptides
Definition: PrecursorIonSelectionPreprocessing.h:148
const std::map< String, std::vector< double > > & getProtMasses() const
void savePreprocessedDBWithRT_(const String &db_path, const String &path)
void loadPreprocessedDB_(const String &path)
loads the preprocessed db
const std::map< String, std::vector< double > > & getProteinRTMap() const
std::map< String, std::vector< double > > rt_prot_map_
Definition: PrecursorIonSelectionPreprocessing.h:159
const std::map< String, std::vector< String > > & getProteinPeptideSequenceMap() const
A more convenient string class.
Definition: String.h:60
int Int
Signed integer type.
Definition: Types.h:102
unsigned int UInt
Unsigned integer type.
Definition: Types.h:94
size_t Size
Size type, e.g. used for a variable that can hold the result of size().
Definition: Types.h:127
std::vector< String > StringList
Vector of String.
Definition: ListUtils.h:70
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:48
FASTA entry type (identifier, description and sequence) The first String corresponds to the identifie...
Definition: FASTAFile.h:72