36 #ifndef OPENMS_FILTERING_NOISEESTIMATION_SIGNALTONOISEESTIMATORMEANITERATIVE_H 37 #define OPENMS_FILTERING_NOISEESTIMATION_SIGNALTONOISEESTIMATORMEANITERATIVE_H 69 template <
typename Container = MSSpectrum>
96 this->
setName(
"SignalToNoiseEstimatorMeanIterative");
98 defaults_.
setValue(
"max_intensity", -1,
"maximal intensity considered for histogram construction. By default, it will be calculated automatically (see auto_mode)." \
99 " Only provide this parameter if you know what you are doing (and change 'auto_mode' to '-1')!" \
100 " All intensities EQUAL/ABOVE 'max_intensity' will not be added to the histogram." \
101 " If you choose 'max_intensity' too small, the noise estimate might be too small as well." \
102 " If chosen too big, the bins become quite large (which you could counter by increasing 'bin_count', which increases runtime).", ListUtils::create<String>(
"advanced"));
105 defaults_.
setValue(
"auto_max_stdev_factor", 3.0,
"parameter for 'max_intensity' estimation (if 'auto_mode' == 0): mean + 'auto_max_stdev_factor' * stdev", ListUtils::create<String>(
"advanced"));
110 defaults_.
setValue(
"auto_max_percentile", 95,
"parameter for 'max_intensity' estimation (if 'auto_mode' == 1): auto_max_percentile th percentile", ListUtils::create<String>(
"advanced"));
114 defaults_.
setValue(
"auto_mode", 0,
"method to use to determine maximal intensity: -1 --> use 'max_intensity'; 0 --> 'auto_max_stdev_factor' method (default); 1 --> 'auto_max_percentile' method", ListUtils::create<String>(
"advanced"));
124 defaults_.
setValue(
"stdev_mp", 3.0,
"multiplier for stdev", ListUtils::create<String>(
"advanced"));
128 defaults_.
setValue(
"min_required_elements", 10,
"minimum number of elements required in a window (otherwise it is considered sparse)");
131 defaults_.
setValue(
"noise_for_empty_window", std::pow(10.0, 20),
"noise value used for sparse windows", ListUtils::create<String>(
"advanced"));
149 if (&source ==
this)
return *
this;
172 virtual void computeSTN_(
const PeakIterator & scan_first_,
const PeakIterator & scan_last_)
175 double sparse_window_percent = 0;
196 OPENMS_PRETTY_FUNCTION,
197 "auto_mode is on AUTOMAXBYPERCENT! auto_max_percentile is not in [0,100]. Use setAutoMaxPercentile(<value>) to change it!",
201 std::vector<int> histogram_auto(100, 0);
206 PeakIterator run = scan_first_;
207 while (run != scan_last_)
209 maxInt = std::max(maxInt, (*run).getIntensity());
214 double bin_size = maxInt / 100;
218 while (run != scan_last_)
220 ++histogram_auto[(int) (((*run).getIntensity() - 1) / bin_size)];
226 int elements_seen = 0;
230 while (run != scan_last_ && elements_seen < elements_below_percentile)
233 elements_seen += histogram_auto[i];
246 OPENMS_PRETTY_FUNCTION,
247 "auto_mode is on MANUAL! max_intensity is <=0. Needs to be positive! Use setMaxIntensity(<value>) or enable auto_mode!",
254 std::cerr <<
"TODO SignalToNoiseEstimatorMedian: the max_intensity_ value should be positive! " <<
max_intensity_ << std::endl;
258 PeakIterator window_pos_center = scan_first_;
259 PeakIterator window_pos_borderleft = scan_first_;
260 PeakIterator window_pos_borderright = scan_first_;
262 double window_half_size =
win_len_ / 2;
271 bin_value[bin] = (bin + 0.5) * bin_size;
274 int hist_rightmost_bin;
282 int elements_in_window = 0;
283 int window_count = 0;
288 int windows_overall = 0;
289 PeakIterator run = scan_first_;
290 while (run != scan_last_)
298 while (window_pos_center != scan_last_)
301 while ((*window_pos_borderleft).getMZ() < (*window_pos_center).getMZ() - window_half_size)
304 to_bin = (int) ((std::max((*window_pos_borderleft).getIntensity(), 0.0f)) / bin_size);
305 if (to_bin < bin_count_)
308 --elements_in_window;
310 ++window_pos_borderleft;
317 while ((window_pos_borderright != scan_last_)
318 && ((*window_pos_borderright).getMZ() < (*window_pos_center).getMZ() + window_half_size))
322 to_bin = (int) ((std::max((*window_pos_borderright).getIntensity(), 0.0f)) / bin_size);
323 if (to_bin < bin_count_)
326 ++elements_in_window;
328 ++window_pos_borderright;
334 ++sparse_window_percent;
342 for (
int i = 0; i < 3; ++i)
346 for (
int bin = 0; bin < hist_rightmost_bin; ++bin)
350 hist_mean += histogram[bin] / (
double) elements_in_window * bin_value[bin];
356 for (
int bin = 0; bin < hist_rightmost_bin; ++bin)
358 double tmp(bin_value[bin] - hist_mean);
359 hist_stdev += histogram[bin] / (
double) elements_in_window * tmp * tmp;
361 hist_stdev = std::sqrt(hist_stdev);
364 int estimate = (int) ((hist_mean + hist_stdev *
stdev_ - 1) / bin_size + 1);
366 hist_rightmost_bin = std::min(estimate, bin_count_);
370 noise = std::max(1.0, hist_mean);
374 stn_estimates_[*window_pos_center] = (*window_pos_center).getIntensity() / noise;
388 sparse_window_percent = sparse_window_percent * 100 / window_count;
390 if (sparse_window_percent > 20)
392 std::cerr <<
"WARNING in SignalToNoiseEstimatorMeanIterative: " 393 << sparse_window_percent
394 <<
"% of all windows were sparse. You should consider increasing 'win_len' or increasing 'min_required_elements'" 395 <<
" You should also check the MaximalIntensity value (or the parameters for its heuristic estimation)" 396 <<
" If it is too low, then too many high intensity peaks will be discarded, which leads to a sparse window!" 446 #endif //OPENMS_FILTERING_NOISEESTIMATION_SIGNALTONOISEESTIMATORMEANITERATIVE_H
Param defaults_
Container for default parameters. This member should be filled in the constructor of derived classes!...
Definition: DefaultParamHandler.h:157
void setValue(const String &key, const DataValue &value, const String &description="", const StringList &tags=StringList())
Sets a value.
A more convenient string class.
Definition: String.h:57
double auto_max_stdev_Factor_
parameter for initial automatic estimation of "max_intensity_": a stdev multiplier ...
Definition: SignalToNoiseEstimatorMeanIterative.h:422
Param param_
Container for current parameters.
Definition: DefaultParamHandler.h:150
void endProgress() const
Ends the progress display.
int min_required_elements_
minimal number of elements a window needs to cover to be used
Definition: SignalToNoiseEstimatorMeanIterative.h:434
SignalToNoiseEstimator< Container >::GaussianEstimate GaussianEstimate
Definition: SignalToNoiseEstimatorMeanIterative.h:89
SignalToNoiseEstimator & operator=(const SignalToNoiseEstimator &source)
Assignment operator.
Definition: SignalToNoiseEstimator.h:92
Container::const_iterator PeakIterator
Definition: SignalToNoiseEstimator.h:65
int bin_count_
number of bins in the histogram
Definition: SignalToNoiseEstimatorMeanIterative.h:430
double variance
variance of estimated Gaussian
Definition: SignalToNoiseEstimator.h:170
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:47
virtual void computeSTN_(const PeakIterator &scan_first_, const PeakIterator &scan_last_)
Definition: SignalToNoiseEstimatorMeanIterative.h:172
double mean
Definition: SignalToNoiseEstimator.h:169
bool is_result_valid_
flag: set to true if SignalToNoise estimates are calculated and none of the params were changed...
Definition: SignalToNoiseEstimator.h:215
void setMaxInt(const String &key, Int max)
Sets the maximum value for the integer or integer list parameter key.
GaussianEstimate estimate_(const PeakIterator &scan_first_, const PeakIterator &scan_last_) const
calculate mean & stdev of intensities of a spectrum
Definition: SignalToNoiseEstimator.h:175
Estimates the signal/noise (S/N) ratio of each data point in a scan based on an iterative scheme whic...
Definition: SignalToNoiseEstimatorMeanIterative.h:70
protected struct to store parameters mu, sigma for a Gaussian distribution
Definition: SignalToNoiseEstimator.h:167
double auto_max_percentile_
parameter for initial automatic estimation of "max_intensity_" percentile or a stdev ...
Definition: SignalToNoiseEstimatorMeanIterative.h:424
double noise_for_empty_window_
Definition: SignalToNoiseEstimatorMeanIterative.h:437
double win_len_
range of data points which belong to a window in Thomson
Definition: SignalToNoiseEstimatorMeanIterative.h:428
SignalToNoiseEstimatorMeanIterative(const SignalToNoiseEstimatorMeanIterative &source)
Copy Constructor.
Definition: SignalToNoiseEstimatorMeanIterative.h:137
const DataValue & getValue(const String &key) const
Returns a value of a parameter.
void setProgress(SignedSize value) const
Sets the current progress.
void setMaxFloat(const String &key, double max)
Sets the maximum value for the floating point or floating point list parameter key.
virtual ~SignalToNoiseEstimatorMeanIterative()
Destructor.
Definition: SignalToNoiseEstimatorMeanIterative.h:160
SignalToNoiseEstimator< Container >::PeakIterator PeakIterator
Definition: SignalToNoiseEstimatorMeanIterative.h:86
PeakIterator::value_type PeakType
Definition: SignalToNoiseEstimator.h:66
SignalToNoiseEstimatorMeanIterative & operator=(const SignalToNoiseEstimatorMeanIterative &source)
Definition: SignalToNoiseEstimatorMeanIterative.h:147
Definition: SignalToNoiseEstimatorMeanIterative.h:77
Invalid value exception.
Definition: Exception.h:336
int auto_mode_
Determines which method is used for estimating "max_intensity_". Valid values are MANUAL=-1, AUTOMAXBYSTDEV=0 or AUTOMAXBYPERCENT=1.
Definition: SignalToNoiseEstimatorMeanIterative.h:426
SignalToNoiseEstimator< Container >::PeakType PeakType
Definition: SignalToNoiseEstimatorMeanIterative.h:87
Definition: SignalToNoiseEstimatorMeanIterative.h:77
void setMinInt(const String &key, Int min)
Sets the minimum value for the integer or integer list parameter key.
void startProgress(SignedSize begin, SignedSize end, const String &label) const
Initializes the progress display.
This class represents the abstract base class of a signal to noise estimator.
Definition: SignalToNoiseEstimator.h:57
SignalToNoiseEstimatorMeanIterative()
default constructor
Definition: SignalToNoiseEstimatorMeanIterative.h:93
std::map< PeakType, double, typename PeakType::PositionLess > stn_estimates_
stores the noise estimate for each peak
Definition: SignalToNoiseEstimator.h:208
IntensityThresholdCalculation
method to use for estimating the maximal intensity that is used for histogram calculation ...
Definition: SignalToNoiseEstimatorMeanIterative.h:77
double max_intensity_
maximal intensity considered during binning (values above get discarded)
Definition: SignalToNoiseEstimatorMeanIterative.h:420
void setName(const String &name)
Mutable access to the name.
double stdev_
multiplier for the stdev of intensities
Definition: SignalToNoiseEstimatorMeanIterative.h:432
void setMinFloat(const String &key, double min)
Sets the minimum value for the floating point or floating point list parameter key.
void updateMembers_()
overridden function from DefaultParamHandler to keep members up to date, when a parameter is changed ...
Definition: SignalToNoiseEstimatorMeanIterative.h:405
void defaultsToParam_()
Updates the parameters after the defaults have been set in the constructor.
Definition: SignalToNoiseEstimatorMeanIterative.h:77