nightly/html/GaussFilterAlgorithm_8h_source.html

 // Copyright (c) 2002-present, OpenMS Inc. -- EKU Tuebingen, ETH Zurich, and FU Berlin

 // SPDX-License-Identifier: BSD-3-Clause

 //

 // --------------------------------------------------------------------------

 // $Maintainer: Hannes Roest $

 // $Authors: Eva Lange $

 // --------------------------------------------------------------------------


 #pragma once


 #include <OpenMS/CONCEPT/Types.h>

 #include <OpenMS/CONCEPT/Constants.h>

 #include <OpenMS/INTERFACES/DataStructures.h>

 #include <OpenMS/MATH/MathFunctions.h>


 #include <cmath>

 #include <vector>


 #include <iostream>


 namespace OpenMS

 {

 // #define DEBUG_FILTERING


   class OPENMS_DLLAPI GaussFilterAlgorithm

   {

 public:

     /// Constructor (declared here only; the definition is not part of this header).
     GaussFilterAlgorithm();


     /// Destructor; virtual, so the class can be destroyed through a base-class pointer.
     virtual ~GaussFilterAlgorithm();


     /**
       @brief Smooths a spectrum containing profile data.

       The m/z and intensity arrays of @p spectrum are read, the smoothed data
       are written into two newly allocated arrays, and those arrays then
       replace the ones stored in the spectrum.

       @note Both output arrays are sized after the m/z array, and one intensity
             value is read per m/z value, so the intensity array is expected to
             hold at least as many entries as the m/z array.

       @param spectrum Spectrum to smooth; its arrays are replaced.
       @return The result of the iterator-based filter() overload, i.e. whether
               any smoothed intensity is non-zero.
     */
     bool filter(OpenMS::Interfaces::SpectrumPtr spectrum)
     {
       // fetch the input arrays once instead of re-querying the spectrum
       const auto raw_mz = spectrum->getMZArray();
       const auto raw_intensity = spectrum->getIntensityArray();
       const auto n_points = raw_mz->data.size();

       // output arrays, both sized after the m/z array
       OpenMS::Interfaces::BinaryDataArrayPtr smoothed_mz(new OpenMS::Interfaces::BinaryDataArray);
       OpenMS::Interfaces::BinaryDataArrayPtr smoothed_intensity(new OpenMS::Interfaces::BinaryDataArray);
       smoothed_mz->data.resize(n_points);
       smoothed_intensity->data.resize(n_points);

       // run the actual smoothing on the raw iterators
       const bool found_signal = filter(raw_mz->data.begin(),
                                        raw_mz->data.end(),
                                        raw_intensity->data.begin(),
                                        smoothed_mz->data.begin(),
                                        smoothed_intensity->data.begin());

       // hand the smoothed arrays over to the spectrum
       spectrum->setMZArray(smoothed_mz);
       spectrum->setIntensityArray(smoothed_intensity);

       return found_signal;
     }


     /**
       @brief Smooths a chromatogram containing profile data.

       The time and intensity arrays of @p chromatogram are read, the smoothed
       data are written into two newly allocated arrays, and those arrays then
       replace the ones stored in the chromatogram.

       @note Both output arrays are sized after the time array, and one intensity
             value is read per time value, so the intensity array is expected to
             hold at least as many entries as the time array.

       @param chromatogram Chromatogram to smooth; its arrays are replaced.
       @return The result of the iterator-based filter() overload, i.e. whether
               any smoothed intensity is non-zero.
     */
     bool filter(OpenMS::Interfaces::ChromatogramPtr chromatogram)
     {
       // fetch the input arrays once instead of re-querying the chromatogram
       const auto raw_rt = chromatogram->getTimeArray();
       const auto raw_intensity = chromatogram->getIntensityArray();
       const auto n_points = raw_rt->data.size();

       // output arrays, both sized after the time array
       OpenMS::Interfaces::BinaryDataArrayPtr smoothed_rt(new OpenMS::Interfaces::BinaryDataArray);
       OpenMS::Interfaces::BinaryDataArrayPtr smoothed_intensity(new OpenMS::Interfaces::BinaryDataArray);
       smoothed_rt->data.resize(n_points);
       smoothed_intensity->data.resize(n_points);

       // run the actual smoothing on the raw iterators
       const bool found_signal = filter(raw_rt->data.begin(),
                                        raw_rt->data.end(),
                                        raw_intensity->data.begin(),
                                        smoothed_rt->data.begin(),
                                        smoothed_intensity->data.begin());

       // hand the smoothed arrays over to the chromatogram
       chromatogram->setTimeArray(smoothed_rt);
       chromatogram->setIntensityArray(smoothed_intensity);

       return found_signal;
     }


     /**
       @brief Smooths two parallel data arrays (positions and intensities).

       For every input position the smoothed intensity is computed with
       integrate_() and written, together with the unchanged position, to the
       output iterators. When the ppm tolerance is enabled, the filter is
       re-initialized for every data point with a width derived from that
       point's position.

       @param mz_in_start  Start of the input positions (m/z or retention time).
       @param mz_in_end    End of the input positions.
       @param int_in_start Start of the input intensities; advanced in lockstep
                           with the positions.
       @param mz_out       Output iterator receiving the positions.
       @param int_out      Output iterator receiving the smoothed intensities.
       @return true if at least one smoothed intensity has non-zero magnitude.
     */
     template <typename ConstIterT, typename IterT>
     bool filter(
         ConstIterT mz_in_start,
         ConstIterT mz_in_end,
         ConstIterT int_in_start,
         IterT mz_out,
         IterT int_out)
     {
       bool any_nonzero = false;

       ConstIterT pos = mz_in_start;
       ConstIterT intensity_pos = int_in_start;
       while (pos != mz_in_end)
       {
         if (use_ppm_tolerance_)
         {
           // the kernel width depends on the position, so it is rebuilt for each data point
           const auto width_at_pos = Math::ppmToMass(ppm_tolerance_, *pos);
           initialize(width_at_pos, spacing_, ppm_tolerance_, use_ppm_tolerance_);
         }

         const double smoothed = integrate_(pos, intensity_pos, mz_in_start, mz_in_end);

         // emit the unchanged position together with the smoothed intensity
         *mz_out = *pos;
         *int_out = smoothed;
         ++mz_out;
         ++int_out;

         if (fabs(smoothed) > 0)
         {
           any_nonzero = true;
         }

         ++pos;
         ++intensity_pos;
       }

       return any_nonzero;
     }


     /**
       @brief Initializes the filter with the given parameters.

       Only the declaration is part of this header. The iterator-based filter()
       overload calls this function again for every data point when the ppm
       tolerance is enabled.
       NOTE(review): presumably this (re)computes coeffs_ and stores the other
       arguments in the corresponding members -- confirm against the definition.

       @param gaussian_width    Width of the Gaussian; filter() passes
                                Math::ppmToMass(ppm_tolerance_, position) here in ppm mode.
       @param spacing           Spacing value; filter() passes spacing_ here.
       @param ppm_tolerance     Tolerance in ppm; filter() passes ppm_tolerance_ here.
       @param use_ppm_tolerance Whether the ppm tolerance is used; filter() passes
                                use_ppm_tolerance_ here.
     */
     void initialize(double gaussian_width, double spacing, double ppm_tolerance, bool use_ppm_tolerance);


 protected:


     /// Coefficients of the pre-tabulated kernel; integrate_() indexes them by (distance / spacing_)
     std::vector<double> coeffs_;

     /// The standard deviation (not read by the code in this header)
     double sigma_;

     /// The spacing of the pre-tabulated kernel coefficients
     double spacing_;


     // tolerance in ppm

     /// If true, filter() re-initializes the filter for every data point using ppm_tolerance_
     bool use_ppm_tolerance_;

     /// Tolerance in ppm; converted with Math::ppmToMass() in filter() when use_ppm_tolerance_ is set
     double ppm_tolerance_;


     template <typename InputPeakIterator>

     double integrate_(InputPeakIterator x /* mz */, InputPeakIterator y /* int */, InputPeakIterator first, InputPeakIterator last)

     {

       double v = 0.;

       // norm the gaussian kernel area to one

       double norm = 0.;

       Size middle = coeffs_.size();


       double start_pos = (( (*x) - (middle * spacing_)) > (*first)) ? ((*x) - (middle * spacing_)) : (*first);

       double end_pos = (( (*x) + (middle * spacing_)) < (*(last - 1))) ? ((*x) + (middle * spacing_)) : (*(last - 1));


       InputPeakIterator help_x = x;

       InputPeakIterator help_y = y;

 #ifdef DEBUG_FILTERING


       std::cout << "integrate from middle to start_pos " << *help_x << " until " << start_pos << std::endl;

 #endif


       //integrate from middle to start_pos

       while ((help_x != first) && (*(help_x - 1) > start_pos))

       {

         // search for the corresponding datapoint of help in the gaussian (take the left most adjacent point)

         double distance_in_gaussian = fabs(*x - *help_x);

         Size left_position = (Size)floor(distance_in_gaussian / spacing_);


         // search for the true left adjacent data point (because of rounding errors)

         for (int j = 0; ((j < 3) &&  (distance(first, help_x - j) >= 0)); ++j)

         {

           if (((left_position - j) * spacing_ <= distance_in_gaussian) && ((left_position - j + 1) * spacing_ >= distance_in_gaussian))

           {

             left_position -= j;

             break;

           }


           if (((left_position + j) * spacing_ < distance_in_gaussian) && ((left_position + j + 1) * spacing_ < distance_in_gaussian))

           {

             left_position += j;

             break;

           }

         }


         // interpolate between the left and right data points in the gaussian to get the true value at position distance_in_gaussian

         Size right_position = left_position + 1;

         double d = fabs((left_position * spacing_) - distance_in_gaussian) / spacing_;

         // check if the right data point in the gaussian exists

         double coeffs_right = (right_position < middle) ? (1 - d) * coeffs_[left_position] + d * coeffs_[right_position]

                                   : coeffs_[left_position];

 #ifdef DEBUG_FILTERING


         std::cout << "distance_in_gaussian " << distance_in_gaussian << std::endl;

         std::cout << " right_position " << right_position << std::endl;

         std::cout << " left_position " << left_position << std::endl;

         std::cout << "coeffs_ at left_position "  <<  coeffs_[left_position] << std::endl;

         std::cout << "coeffs_ at right_position "  <<  coeffs_[right_position] << std::endl;

         std::cout << "interpolated value left " << coeffs_right << std::endl;

 #endif


         // search for the corresponding datapoint for (help-1) in the gaussian (take the left most adjacent point)

         distance_in_gaussian = fabs((*x) - (*(help_x - 1)));

         left_position = (Size)floor(distance_in_gaussian / spacing_);


         // search for the true left adjacent data point (because of rounding errors)

         for (UInt j = 0; ((j < 3) && (distance(first, help_x - j) >= 0)); ++j)

         {

           if (((left_position - j) * spacing_ <= distance_in_gaussian) && ((left_position - j + 1) * spacing_ >= distance_in_gaussian))

           {

             left_position -= j;

             break;

           }


           if (((left_position + j) * spacing_ < distance_in_gaussian) && ((left_position + j + 1) * spacing_ < distance_in_gaussian))

           {

             left_position += j;

             break;

           }

         }


         // start the interpolation for the true value in the gaussian

         right_position = left_position + 1;

         d = fabs((left_position * spacing_) - distance_in_gaussian) / spacing_;

         double coeffs_left = (right_position < middle) ? (1 - d) * coeffs_[left_position] + d * coeffs_[right_position]

                                  : coeffs_[left_position];

 #ifdef DEBUG_FILTERING


         std::cout << " help_x-1 " << *(help_x - 1) << " distance_in_gaussian " << distance_in_gaussian << std::endl;

         std::cout << " right_position " << right_position << std::endl;

         std::cout << " left_position " << left_position << std::endl;

         std::cout << "coeffs_ at left_position " <<  coeffs_[left_position] << std::endl;

         std::cout << "coeffs_ at right_position " <<   coeffs_[right_position] << std::endl;

         std::cout << "interpolated value right " << coeffs_left << std::endl;


         std::cout << " intensity " << fabs(*(help_x - 1) - (*help_x)) / 2. << " * " << *(help_y - 1) << " * " << coeffs_left << " + " << *help_y << "* " << coeffs_right

                   << std::endl;

 #endif


         norm += fabs((*(help_x - 1)) - (*help_x)) / 2. * (coeffs_left + coeffs_right);


         v += fabs((*(help_x - 1)) - (*help_x)) / 2. * (*(help_y - 1) * coeffs_left + (*help_y) * coeffs_right);

         --help_x;

         --help_y;

       }


       //integrate from middle to end_pos

       help_x = x;

       help_y = y;

 #ifdef DEBUG_FILTERING


       std::cout << "integrate from middle to endpos " << *help_x << " until " << end_pos << std::endl;

 #endif


       while ((help_x != (last - 1)) && (*(help_x + 1) < end_pos))

       {

         // search for the corresponding datapoint for help in the gaussian (take the left most adjacent point)

         double distance_in_gaussian = fabs((*x) - (*help_x));

         int left_position = (UInt)floor(distance_in_gaussian / spacing_);


         // search for the true left adjacent data point (because of rounding errors)

         for (int j = 0; ((j < 3) && (distance(help_x + j, last - 1) >= 0)); ++j)

         {

           if (((left_position - j) * spacing_ <= distance_in_gaussian) && ((left_position - j + 1) * spacing_ >= distance_in_gaussian))

           {

             left_position -= j;

             break;

           }


           if (((left_position + j) * spacing_ < distance_in_gaussian) && ((left_position + j + 1) * spacing_ < distance_in_gaussian))

           {

             left_position += j;

             break;

           }

         }

         // start the interpolation for the true value in the gaussian

         Size right_position = left_position + 1;

         double d = fabs((left_position * spacing_) - distance_in_gaussian) / spacing_;

         double coeffs_left = (right_position < middle) ? (1 - d) * coeffs_[left_position] + d * coeffs_[right_position]

                                  : coeffs_[left_position];


 #ifdef DEBUG_FILTERING


         std::cout << " help " << *help_x << " distance_in_gaussian " << distance_in_gaussian << std::endl;

         std::cout << " left_position " << left_position << std::endl;

         std::cout << "coeffs_ at right_position " <<  coeffs_[left_position] << std::endl;

         std::cout << "coeffs_ at left_position " <<  coeffs_[right_position] << std::endl;

         std::cout << "interpolated value left " << coeffs_left << std::endl;

 #endif


         // search for the corresponding datapoint for (help+1) in the gaussian (take the left most adjacent point)

         distance_in_gaussian = fabs((*x) - (*(help_x + 1)));

         left_position = (UInt)floor(distance_in_gaussian / spacing_);


         // search for the true left adjacent data point (because of rounding errors)

         for (int j = 0; ((j < 3) && (distance(help_x + j, last - 1) >= 0)); ++j)

         {

           if (((left_position - j) * spacing_ <= distance_in_gaussian) && ((left_position - j + 1) * spacing_ >= distance_in_gaussian))

           {

             left_position -= j;

             break;

           }


           if (((left_position + j) * spacing_ < distance_in_gaussian) && ((left_position + j + 1) * spacing_ < distance_in_gaussian))

           {

             left_position += j;

             break;

           }

         }


         // start the interpolation for the true value in the gaussian

         right_position = left_position + 1;

         d = fabs((left_position * spacing_) - distance_in_gaussian) / spacing_;

         double coeffs_right = (right_position < middle) ? (1 - d) * coeffs_[left_position] + d * coeffs_[right_position]

                                   : coeffs_[left_position];

 #ifdef DEBUG_FILTERING


         std::cout << " (help + 1) " << *(help_x + 1) << " distance_in_gaussian " << distance_in_gaussian << std::endl;

         std::cout << " left_position " << left_position << std::endl;

         std::cout << "coeffs_ at right_position " <<   coeffs_[left_position] << std::endl;

         std::cout << "coeffs_ at left_position " <<  coeffs_[right_position] << std::endl;

         std::cout << "interpolated value right " << coeffs_right << std::endl;


         std::cout << " intensity " <<  fabs(*help_x - *(help_x + 1)) / 2.

                   << " * " << *help_y << " * " << coeffs_left << " + " << *(help_y + 1)

                   << "* " << coeffs_right

                   << std::endl;

 #endif

         norm += fabs((*help_x) - (*(help_x + 1)) ) / 2. * (coeffs_left + coeffs_right);


         v += fabs((*help_x) - (*(help_x + 1)) ) / 2. * ((*help_y) * coeffs_left + (*(help_y + 1)) * coeffs_right);

         ++help_x;

         ++help_y;

       }


       if (v > 0)

       {

         return v / norm;

       }

       else

       {

         return 0;

       }

     }


   };


 } // namespace OpenMS

Constants.h

MathFunctions.h

Types.h

OpenMS::GaussFilterAlgorithm
This class represents a Gaussian lowpass-filter which works on uniform as well as on non-uniform prof...
Definition: GaussFilterAlgorithm.h:48

OpenMS::GaussFilterAlgorithm::coeffs_
std::vector< double > coeffs_
Coefficients.
Definition: GaussFilterAlgorithm.h:147

OpenMS::GaussFilterAlgorithm::GaussFilterAlgorithm
GaussFilterAlgorithm()
Constructor.

OpenMS::GaussFilterAlgorithm::initialize
void initialize(double gaussian_width, double spacing, double ppm_tolerance, bool use_ppm_tolerance)

OpenMS::GaussFilterAlgorithm::sigma_
double sigma_
The standard deviation.
Definition: GaussFilterAlgorithm.h:149

OpenMS::GaussFilterAlgorithm::filter
bool filter(ConstIterT mz_in_start, ConstIterT mz_in_end, ConstIterT int_in_start, IterT mz_out, IterT int_out)
Smooths two data arrays.
Definition: GaussFilterAlgorithm.h:110

OpenMS::GaussFilterAlgorithm::integrate_
double integrate_(InputPeakIterator x, InputPeakIterator y, InputPeakIterator first, InputPeakIterator last)
Computes the convolution of the raw data at position x and the gaussian kernel.
Definition: GaussFilterAlgorithm.h:159

OpenMS::GaussFilterAlgorithm::spacing_
double spacing_
The spacing of the pre-tabulated kernel coefficients.
Definition: GaussFilterAlgorithm.h:151

OpenMS::GaussFilterAlgorithm::ppm_tolerance_
double ppm_tolerance_
Definition: GaussFilterAlgorithm.h:155

OpenMS::GaussFilterAlgorithm::~GaussFilterAlgorithm
virtual ~GaussFilterAlgorithm()
Destructor.

OpenMS::GaussFilterAlgorithm::use_ppm_tolerance_
bool use_ppm_tolerance_
Definition: GaussFilterAlgorithm.h:154

OpenMS::GaussFilterAlgorithm::filter
bool filter(OpenMS::Interfaces::SpectrumPtr spectrum)
Smooths a Spectrum containing profile data.
Definition: GaussFilterAlgorithm.h:59

OpenMS::GaussFilterAlgorithm::filter
bool filter(OpenMS::Interfaces::ChromatogramPtr chromatogram)
Smooths a Chromatogram containing profile data.
Definition: GaussFilterAlgorithm.h:83

OpenMS::UInt
unsigned int UInt
Unsigned integer type.
Definition: Types.h:64

OpenMS::Size
size_t Size
Size type e.g. used as variable which can hold result of size()
Definition: Types.h:97

OpenMS::Interfaces::ChromatogramPtr
std::shared_ptr< Chromatogram > ChromatogramPtr
Definition: openms/include/OpenMS/INTERFACES/DataStructures.h:130

OpenMS::Interfaces::SpectrumPtr
std::shared_ptr< Spectrum > SpectrumPtr
Definition: openms/include/OpenMS/INTERFACES/DataStructures.h:210

OpenMS::Interfaces::BinaryDataArrayPtr
std::shared_ptr< BinaryDataArray > BinaryDataArrayPtr
Definition: openms/include/OpenMS/INTERFACES/DataStructures.h:54

OpenMS::Interfaces::BinaryDataArray
The datastructures used by the OpenSwath interfaces.
Definition: openms/include/OpenMS/INTERFACES/DataStructures.h:47

OpenMS::Math::ppmToMass
T ppmToMass(T ppm, T mz_ref)
Compute the mass diff in [Th], given a ppm value and a reference point.
Definition: MathFunctions.h:404

OpenMS
Main OpenMS namespace.
Definition: openswathalgo/include/OpenMS/OPENSWATHALGO/DATAACCESS/ISpectrumAccess.h:19

OpenSwath::norm
double norm(T beg, T end)
compute the Euclidean norm of the vector
Definition: StatsHelpers.h:31

DataStructures.h