OpenMS 3.0.0
Go to the documentation of this file.
45 #include <boost/regex.hpp>
50 class PeptideIdentification;
93 double cut_off = DBL_MAX;
104 double suitability = 0;
108 double suitability_no_rerank = 0;
111 double suitability_corr_no_rerank = 0;
118 void setCorrectionFactor(
double factor);
120 double getCorrectionFactor()
const;
122 double getCorrectedNovoHits()
const;
124 double getCorrectedSuitability()
const;
145 double num_top_novo_corr = 0;
152 double suitability_corr = 0;
229 void compute(std::vector<PeptideIdentification>&& pep_ids,
const MSExperiment& exp,
const std::vector<FASTAFile::FASTAEntry>& original_fasta,
const std::vector<FASTAFile::FASTAEntry>& novo_fasta,
const ProteinIdentification::SearchParameters& search_params);
240 const std::vector<SuitabilityData>& getResults()
const;
279 double getDecoyCutOff_(
const std::vector<PeptideIdentification>& pep_ids,
double reranking_cutoff_percentile)
const;
304 bool checkScoreBetterThanThreshold_(
const PeptideHit& hit,
double threshold,
bool higher_score_better)
const;
325 void writeIniFile_(
const Param& parameters,
const String& filename)
const;
349 std::vector<PeptideIdentification> runIdentificationSearch_(
const MSExperiment& exp,
const std::vector<FASTAFile::FASTAEntry>& fasta_data,
const String& adapter_name,
Param& parameters)
const;
361 std::vector<FASTAFile::FASTAEntry> getSubsampledFasta_(
const std::vector<FASTAFile::FASTAEntry>& fasta_data,
double subsampling_rate)
const;
379 void calculateSuitability_(
const std::vector<PeptideIdentification>& pep_ids,
SuitabilityData& data)
const;
390 void appendDecoys_(std::vector<FASTAFile::FASTAEntry>& fasta)
const;
399 double extractScore_(
const PeptideHit& pep_hit)
const;
424 UInt numberOfUniqueProteins_(
const std::vector<PeptideIdentification>& peps,
UInt number_of_hits = 1)
const;
434 Size getIndexWithMedianNovoHits_(
const std::vector<SuitabilityData>& data)
const;
452 double getScoreMatchingFDR_(
const std::vector<PeptideIdentification>& pep_ids,
double FDR,
String score_name,
bool higher_score_better)
const;
463 std::vector<FASTAFile::FASTAEntry>
getSubsampledFasta(
const std::vector<FASTAFile::FASTAEntry>& fasta_data,
double subsampling_rate)
Size getIndexWithMedianNovoHits(const std::vector< DBSuitability::SuitabilityData > &data)
Definition: DBSuitability.h:483
double corr_factor
Definition: DBSuitability.h:142
~DBSuitability_friend()=default
std::vector< SuitabilityData > results_
result vector
Definition: DBSuitability.h:244
Size getIndexWithMedianNovoHits_(const std::vector< SuitabilityData > &data) const
Finds the SuitabilityData object with the median number of de novo hits.
Definition: DBSuitability.h:456
A more convenient string class.
Definition: String.h:58
In-Memory representation of a mass spectrometry run.
Definition: MSExperiment.h:70
size_t Size
Size type, e.g. used for variables that hold the result of size()
Definition: Types.h:127
double calculateCorrectionFactor(const DBSuitability::SuitabilityData &data, const DBSuitability::SuitabilityData &data_sampled, double sampling_rate)
Definition: DBSuitability.h:473
UInt numberOfUniqueProteins(const std::vector< PeptideIdentification > &peps, UInt number_of_hits=1)
Definition: DBSuitability.h:478
double calculateCorrectionFactor_(const SuitabilityData &data, const SuitabilityData &data_sampled, double sampling_rate) const
Calculates the correction factor from two suitability calculations.
This class holds the functionality of calculating the database suitability.
Definition: DBSuitability.h:71
double getScoreMatchingFDR(const std::vector< PeptideIdentification > &pep_ids, double FDR, String score_name, bool higher_score_better)
Definition: DBSuitability.h:488
DBSuitability suit_
Definition: DBSuitability.h:505
A base class for all classes handling default parameters.
Definition: DefaultParamHandler.h:92
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:47
const boost::regex decoy_pattern_
pattern for finding a decoy string
Definition: DBSuitability.h:247
std::vector< FASTAFile::FASTAEntry > getSubsampledFasta(const std::vector< FASTAFile::FASTAEntry > &fasta_data, double subsampling_rate)
Definition: DBSuitability.h:463
unsigned int UInt
Unsigned integer type.
Definition: Types.h:94
Represents the peptide hits for a spectrum.
Definition: PeptideIdentification.h:63
void appendDecoys(std::vector< FASTAFile::FASTAEntry > &fasta)
Definition: DBSuitability.h:468
double getScoreMatchingFDR_(const std::vector< PeptideIdentification > &pep_ids, double FDR, String score_name, bool higher_score_better) const
Extracts the worst score that still passes an FDR (q-value) threshold.
Management and storage of parameters / INI files.
Definition: Param.h:69
struct to store results
Definition: DBSuitability.h:76
UInt numberOfUniqueProteins_(const std::vector< PeptideIdentification > &peps, UInt number_of_hits=1) const
Determines the number of unique proteins found in the protein accessions of PeptideIdentifications.
Search parameters of the DB search.
Definition: ProteinIdentification.h:258
void appendDecoys_(std::vector< FASTAFile::FASTAEntry > &fasta) const
Calculates and appends decoys to a given vector of FASTAEntry.
DBSuitability_friend()=default
std::vector< FASTAFile::FASTAEntry > getSubsampledFasta_(const std::vector< FASTAFile::FASTAEntry > &fasta_data, double subsampling_rate) const
Creates a subsampled fasta with the given subsampling rate.
Representation of a peptide hit.
Definition: PeptideHit.h:55