2.2.0/bpp-core/LowMemoryRescaledHmmLikelihood_8cpp_source.html

 //
 // File: LowMemoryRescaledHmmLikelihood.cpp
 // Created by: Julien Dutheil
 // Created on: Wed Dec 16 10:47 2009
 //

 /*
    Copyright or © or Copr. Bio++ Development Team, (November 16, 2004)

    This software is a computer program whose purpose is to provide classes
    for phylogenetic data analysis.

    This software is governed by the CeCILL  license under French law and
    abiding by the rules of distribution of free software.  You can  use,
    modify and/ or redistribute the software under the terms of the CeCILL
    license as circulated by CEA, CNRS and INRIA at the following URL
    "http://www.cecill.info".

    As a counterpart to the access to the source code and  rights to copy,
    modify and redistribute granted by the license, users are provided only
    with a limited warranty  and the software's author,  the holder of the
    economic rights,  and the successive licensors  have only  limited
    liability.

    In this respect, the user's attention is drawn to the risks associated
    with loading,  using,  modifying and/or developing or reproducing the
    software by the user in light of its specific status of free software,
    that may mean  that it is complicated to manipulate,  and  that  also
    therefore means  that it is reserved for developers  and  experienced
    professionals having in-depth computer knowledge. Users are therefore
    encouraged to load and test the software's suitability as regards their
    requirements in conditions enabling the security of their systems and/or
    data to be ensured and,  more generally, to use and operate it in the
    same conditions as regards security.

    The fact that you are presently reading this means that you have had
    knowledge of the CeCILL license and that you accept its terms.
  */

 #include "LowMemoryRescaledHmmLikelihood.h"

 // from the STL:
 #include <iostream>
 #include <algorithm>
 using namespace bpp;
 using namespace std;

 // Build the likelihood object from its three HMM components.
 //
 // hiddenAlphabet         The hidden states alphabet (must not be null).
 // transitionMatrix       The transition probabilities (must not be null).
 // emissionProbabilities  The emission probabilities (must not be null).
 // prefix                 Forwarded to AbstractParametrizable.
 // maxSize                Stored in maxSize_; computeForward_() uses it as the
 //                        size of the buffer of per-site log scaling factors.
 //
 // Throws Exception if one of the pointers is null, or if the hidden alphabet
 // reports (through worksWith()) that it is not compatible with the alphabet
 // referenced by the transition matrix or by the emission probabilities.
 //
 // The forward recursion is run once before the constructor returns.
 LowMemoryRescaledHmmLikelihood::LowMemoryRescaledHmmLikelihood(
   HmmStateAlphabet* hiddenAlphabet,
   HmmTransitionMatrix* transitionMatrix,
   HmmEmissionProbabilities* emissionProbabilities,
   const std::string& prefix,
   size_t maxSize) throw (Exception) :
   AbstractHmmLikelihood(),
   AbstractParametrizable(prefix),
   hiddenAlphabet_(hiddenAlphabet),
   transitionMatrix_(transitionMatrix),
   emissionProbabilities_(emissionProbabilities),
   likelihood1_(),
   likelihood2_(),
   logLik_(),
   maxSize_(maxSize),
   breakPoints_(),
   nbStates_(),
   nbSites_()
 {
   // Every component is mandatory:
   if (hiddenAlphabet == 0)
   {
     throw Exception("LowMemoryRescaledHmmLikelihood: null pointer passed for HmmStateAlphabet.");
   }
   if (transitionMatrix == 0)
   {
     throw Exception("LowMemoryRescaledHmmLikelihood: null pointer passed for HmmTransitionMatrix.");
   }
   if (emissionProbabilities == 0)
   {
     throw Exception("LowMemoryRescaledHmmLikelihood: null pointer passed for HmmEmissionProbabilities.");
   }

   // All components have to be built on a compatible hidden alphabet:
   const bool transitionsCompatible = hiddenAlphabet_->worksWith(transitionMatrix->getHmmStateAlphabet());
   if (!transitionsCompatible)
   {
     throw Exception("LowMemoryRescaledHmmLikelihood: HmmTransitionMatrix and HmmEmissionProbabilities should point toward the same HmmStateAlphabet object.");
   }
   const bool emissionsCompatible = hiddenAlphabet_->worksWith(emissionProbabilities->getHmmStateAlphabet());
   if (!emissionsCompatible)
   {
     throw Exception("LowMemoryRescaledHmmLikelihood: HmmTransitionMatrix and HmmEmissionProbabilities should point toward the same HmmStateAlphabet object.");
   }

   // Dimensions, and the two per-state arrays used alternately by the recursion:
   nbStates_ = hiddenAlphabet_->getNumberOfStates();
   likelihood1_.resize(nbStates_);
   likelihood2_.resize(nbStates_);
   nbSites_ = emissionProbabilities_->getNumberOfPositions();

   // Expose the parameters of the three components as parameters of this object
   // (alphabet first, then transitions, then emissions):
   addParameters_(hiddenAlphabet_->getParameters());
   addParameters_(transitionMatrix_->getParameters());
   addParameters_(emissionProbabilities_->getParameters());

   // Initial likelihood computation:
   computeForward_();
 }

 // Propagate new parameter values to the HMM components and recompute the
 // likelihood.
 //
 // pl  The parameters that changed.
 void LowMemoryRescaledHmmLikelihood::fireParameterChanged(const ParameterList& pl)
 {
   // Each component picks the values it is concerned with. The returned flags
   // are used below as "this component was updated by pl".
   const bool alphabetUpdated    = hiddenAlphabet_->matchParametersValues(pl);
   const bool transitionsUpdated = transitionMatrix_->matchParametersValues(pl);
   const bool emissionsUpdated   = emissionProbabilities_->matchParametersValues(pl);

   // Transitions and emissions can depend on the alphabet, so a component that
   // was not updated by pl itself is refreshed by re-applying its own current
   // values. A StateChangeEvent could be used instead, but it would lead to
   // some calculations being performed twice when both the alphabet and
   // another parameter changed.
   if (alphabetUpdated)
   {
     if (!transitionsUpdated)
     {
       transitionMatrix_->setParametersValues(transitionMatrix_->getParameters());
     }
     if (!emissionsUpdated)
     {
       emissionProbabilities_->setParametersValues(emissionProbabilities_->getParameters());
     }
   }

   computeForward_();
 }

 /***************************************************************************************************************************/

 void LowMemoryRescaledHmmLikelihood::computeForward_()
 {
   double x;
   vector<double> tmp(nbStates_);
   vector<double> lScales(min(maxSize_, nbSites_));
   vector<double> trans(nbStates_ * nbStates_);

   // Transition probabilities:
   for (size_t i = 0; i < nbStates_; i++)
   {
    size_t ii = i * nbStates_;
     for (size_t j = 0; j < nbStates_; j++)
     {
       trans[ii + j] = transitionMatrix_->Pij(j, i);
     }
   }

   // Initialisation:
   double scale = 0;
   const vector<double>* emissions = &(*emissionProbabilities_)(0);
   for (size_t j = 0; j < nbStates_; j++)
   {
     size_t jj = j * nbStates_;
     x = 0;
     for (size_t k = 0; k < nbStates_; k++)
     {
       x += trans[k + jj] * transitionMatrix_->getEquilibriumFrequencies()[k];
     }
     tmp[j] = (*emissions)[j] * x;
     scale += tmp[j];
   }
   for (size_t j = 0; j < nbStates_; j++)
   {
     likelihood1_[j] = tmp[j] / scale;
   }
   lScales[0] = log(scale);

   vector<double>* previousLikelihood = &likelihood2_, * currentLikelihood = &likelihood1_, * tmpLikelihood;

   // Recursion:
   size_t nextBrkPt = nbSites_; // next break point
   vector<size_t>::const_iterator bpIt = breakPoints_.begin();
   if (bpIt != breakPoints_.end()) nextBrkPt = *bpIt;

   double a;
   logLik_ = 0;
   size_t offset = 0;
   greater<double> cmp;
   for (size_t i = 1; i < nbSites_; i++)
   {
     //Swap pointers:
     tmpLikelihood = previousLikelihood;
     previousLikelihood = currentLikelihood;
     currentLikelihood = tmpLikelihood;

     scale = 0;
     emissions = &(*emissionProbabilities_)(i);
     if (i < nextBrkPt)
     {
       for (size_t j = 0; j < nbStates_; j++)
       {
         size_t jj = j * nbStates_;
         x = 0;
         for (size_t k = 0; k < nbStates_; k++)
         {
           a = trans[jj + k] * (*previousLikelihood)[k];
           if (a < 0)
           {
             // *ApplicationTools::warning << "Negative value for likelihood at " << i << ", state " << j << ": " << _likelihood[i-1][k] << ", Pij = " << _hiddenModel->Pij(k, j) << endl;
             a = 0;
           }
           x += a;
         }
         tmp[j] = (*emissions)[j] * x;
         if (tmp[j] < 0)
         {
           // *ApplicationTools::warning << "Negative emission probability at " << i << ", state " << j << ": " << _emissions[i][j] << endl;
           tmp[j] = 0;
         }
         scale += tmp[j];
       }
     }
     else // Reset markov chain:
     {
       for (size_t j = 0; j < nbStates_; j++)
       {
         size_t jj = j * nbStates_;
         x = 0;
         for (size_t k = 0; k < nbStates_; k++)
         {
           a = trans[jj + k] * transitionMatrix_->getEquilibriumFrequencies()[k];
           if (a < 0)
           {
             // *ApplicationTools::warning << "Negative value for likelihood at " << i << ", state " << j << ": " << _likelihood[i-1][k] << ", Pij = " << _hiddenModel->Pij(k, j) << endl;
             a = 0;
           }
           x += a;
         }
         tmp[j] = (*emissions)[j] * x;
         if (tmp[j] < 0)
         {
           // *ApplicationTools::warning << "Negative emission probability at " << i << ", state " << j << ": " << _emissions[i][j] << endl;
           tmp[j] = 0;
         }
         scale += tmp[j];
       }
       bpIt++;
       if (bpIt != breakPoints_.end()) nextBrkPt = *bpIt;
       else nextBrkPt = nbSites_;
     }

     for (size_t j = 0; j < nbStates_; j++)
     {
       if (scale > 0) (*currentLikelihood)[j] = tmp[j] / scale;
       else (*currentLikelihood)[j] = 0;
     }
     lScales[i - offset] = log(scale);

     if (i - offset == maxSize_ - 1)
     {
       //We make partial calculations and reset the arrays:
       double partialLogLik = 0;
       sort(lScales.begin(), lScales.end(), cmp);
       for (size_t j = 0; j < maxSize_; ++j)
       {
         partialLogLik += lScales[j];
       }
       logLik_ += partialLogLik;
       offset += maxSize_;
     }
   }
   sort(lScales.begin(), lScales.begin() + static_cast<ptrdiff_t>(nbSites_ - offset), cmp);
   double partialLogLik = 0;
   for (size_t i = 0; i < nbSites_ - offset; ++i)
   {
     partialLogLik += lScales[i];
   }
   logLik_ += partialLogLik;
 }

 /***************************************************************************************************************************/

bpp::HmmStateAlphabet
Hidden states alphabet.
Definition: HmmStateAlphabet.h:62

bpp
This class allows to perform a correspondence analysis.
Definition: ApplicationTools.h:58

bpp::AbstractParametrizable
A partial implementation of the Parametrizable interface.
Definition: AbstractParametrizable.h:62

bpp::HmmEmissionProbabilities
Interface for computing emission probabilities in a Hidden Markov Model.
Definition: HmmEmissionProbabilities.h:64

std
STL namespace.

bpp::ParameterList
The parameter list object.
Definition: ParameterList.h:61

bpp::AbstractHmmLikelihood
Definition: HmmLikelihood.h:139

bpp::Exception
Exception base class.
Definition: Exceptions.h:57

bpp::LowMemoryRescaledHmmLikelihood::LowMemoryRescaledHmmLikelihood
LowMemoryRescaledHmmLikelihood(HmmStateAlphabet *hiddenAlphabet, HmmTransitionMatrix *transitionMatrix, HmmEmissionProbabilities *emissionProbabilities, const std::string &prefix, size_t maxSize=1000000)
Build a new LowMemoryRescaledHmmLikelihood object.
Definition: LowMemoryRescaledHmmLikelihood.cpp:48

LowMemoryRescaledHmmLikelihood.h

bpp::LowMemoryRescaledHmmLikelihood::computeForward_
void computeForward_()
Definition: LowMemoryRescaledHmmLikelihood.cpp:106

bpp::LowMemoryRescaledHmmLikelihood::fireParameterChanged
void fireParameterChanged(const ParameterList &pl)
Notify the class when one or several parameters have changed.
Definition: LowMemoryRescaledHmmLikelihood.cpp:90

bpp::HmmTransitionMatrix
Describes the transition probabilities between hidden states of a Hidden Markov Model.
Definition: HmmTransitionMatrix.h:59