root/html606/LDA_8cxx_source.html

 // $Id$

 /**********************************************************************************

  * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

  * Package: TMVA                                                                  *

  * Class  : LDA                                                                   *

  * Web    : http://tmva.sourceforge.net                                           *

  *                                                                                *

  * Description:                                                                   *

  *      Local LDA method used by MethodKNN to compute MVA value.                  *

  *      This is experimental code under development. This class computes          *

  *      parameters of signal and background PDFs using Gaussian approximation.    *

  *                                                                                *

  * Author:                                                                        *

  *      John Alison John.Alison@cern.ch - University of Pennsylvania, USA         *

  *                                                                                *

  * Copyright (c) 2007:                                                            *

  *      CERN, Switzerland                                                         *

  *      MPI-K Heidelberg, Germany                                                 *

  *      University of Pennsylvania, USA                                           *

  *                                                                                *

  * Redistribution and use in source and binary forms, with or without             *

  * modification, are permitted according to the terms listed in LICENSE           *

  * (http://tmva.sourceforge.net/LICENSE)                                          *

  **********************************************************************************/


 // Local

 #include "TMVA/LDA.h"


 // C/C++

 #include <iostream>


 #ifndef ROOT_TDecompSVD

 #include "TDecompSVD.h"

 #endif

 #ifndef ROOT_TMatrixF

 #include "TMatrixF.h"

 #endif

 #ifndef ROOT_TMath

 #include "TMath.h"

 #endif


 #ifndef ROOT_TMVA_Types

 #include "TMVA/Types.h"

 #endif

 #ifndef ROOT_TMVA_MsgLogger

 #include "TMVA/MsgLogger.h"

 #endif


 ////////////////////////////////////////////////////////////////////////////////
 /// Build an LDA object that holds no covariance information yet.
 ///
 /// \param tolerence  kept in fTolerence; Initialize() uses it as the floor
 ///                   applied to the singular values of the covariance matrix
 /// \param debug      kept in fDebug; switches on the extra printouts made by
 ///                   Initialize()
 ///
 /// Both matrix pointers start out null, the parameter count starts at zero,
 /// and a message logger named "LDA" is allocated on the heap.

 TMVA::LDA::LDA( Float_t tolerence, Bool_t debug )
    : fTolerence( tolerence ), fNumParams( 0 ),
      fSigma( 0 ), fSigmaInverse( 0 ),
      fDebug( debug ),
      // NOTE(review): debug==true passes kINFO and debug==false passes kDEBUG to
      // the logger; this looks inverted -- confirm against MsgLogger's
      // constructor before changing it.
      fLogger( new MsgLogger( "LDA", ( debug ? kINFO : kDEBUG ) ) )
 {
 }


 ////////////////////////////////////////////////////////////////////////////////
 /// Destructor: releases every heap object reachable through the raw pointer
 /// members of this class.
 ///
 /// fSigma is allocated with `new` in Initialize() and was previously leaked
 /// when the object was destroyed. fSigmaInverse is an owned raw pointer of the
 /// same kind. Both are null until they are allocated, and deleting a null
 /// pointer is a no-op, so no additional checks are required.

 TMVA::LDA::~LDA()
 {
    delete fSigma;
    delete fSigmaInverse;
    delete fLogger;
 }


 ////////////////////////////////////////////////////////////////////////////////

 /// Create LDA matrix using local events found by knn method


 void TMVA::LDA::Initialize(const LDAEvents& inputSignalEvents, const LDAEvents& inputBackgroundEvents)

 {

    Log() << kDEBUG << "There are: " << inputSignalEvents.size() << " input signal events " << Endl;

    Log() << kDEBUG << "There are: " << inputBackgroundEvents.size() << " input background events " << Endl;


    fNumParams = inputSignalEvents[0].size();


    UInt_t numSignalEvents = inputSignalEvents.size();

    UInt_t numBackEvents  = inputBackgroundEvents.size();

    UInt_t numTotalEvents = numSignalEvents + numBackEvents;

    fEventFraction[0] = (Float_t)numBackEvents/numTotalEvents;

    fEventFraction[1] = (Float_t)numSignalEvents/numTotalEvents;

    UInt_t K = 2;


    // get the mean of the signal and background for each parameter

    std::vector<Float_t> m_muSignal (fNumParams,0.0);

    std::vector<Float_t> m_muBackground (fNumParams,0.0);

    for (UInt_t param=0; param < fNumParams; ++param) {

       for (UInt_t eventNumber=0; eventNumber < numSignalEvents; ++eventNumber)

          m_muSignal[param] += inputSignalEvents[eventNumber][param];

       for (UInt_t eventNumber=0; eventNumber < numBackEvents; ++eventNumber)

          m_muBackground[param] += inputBackgroundEvents[eventNumber][param]/numBackEvents;

       if (numSignalEvents > 0) m_muSignal[param] /= numSignalEvents;

       if (numBackEvents > 0 )  m_muBackground[param] /= numBackEvents;

    }

    fMu[0] = m_muBackground;

    fMu[1] = m_muSignal;


    if (fDebug) {

       Log() << kDEBUG << "the signal means" << Endl;

       for (UInt_t param=0; param < fNumParams; ++param)

          Log() << kDEBUG << m_muSignal[param] << Endl;

       Log() << kDEBUG << "the background means" << Endl;

       for (UInt_t param=0; param < inputBackgroundEvents[0].size(); ++param)

          Log() << kDEBUG << m_muBackground[param] << Endl;

    }


    // sigma is a sum of two symmetric matrices, one for the background and one for signal

    // get the matricies seperately (def not be the best way to do it!)


    // the signal, background, and total matrix

    TMatrixF sigmaSignal(fNumParams, fNumParams);

    TMatrixF sigmaBack(fNumParams, fNumParams);

    if (fSigma!=0) delete fSigma;

    fSigma = new TMatrixF(fNumParams, fNumParams);

    for (UInt_t row=0; row < fNumParams; ++row) {

       for (UInt_t col=0; col < fNumParams; ++col) {

          sigmaSignal[row][col] = 0;

          sigmaBack[row][col] = 0;

          (*fSigma)[row][col] = 0;

       }

    }


    for (UInt_t eventNumber=0; eventNumber < numSignalEvents; ++eventNumber) {

       for (UInt_t row=0; row < fNumParams; ++row) {

          for (UInt_t col=0; col < fNumParams; ++col) {

             sigmaSignal[row][col] += (inputSignalEvents[eventNumber][row] - m_muSignal[row]) * (inputSignalEvents[eventNumber][col] - m_muSignal[col] );

          }

       }

    }


    for (UInt_t eventNumber=0; eventNumber < numBackEvents; ++eventNumber) {

       for (UInt_t row=0; row < fNumParams; ++row) {

          for (UInt_t col=0; col < fNumParams; ++col) {

             sigmaBack[row][col] += (inputBackgroundEvents[eventNumber][row] - m_muBackground[row]) * (inputBackgroundEvents[eventNumber][col] - m_muBackground[col] );

          }

       }

    }


    // the total matrix

    *fSigma = sigmaBack + sigmaSignal;

    *fSigma *= 1.0/(numTotalEvents - K);


    if (fDebug) {

       Log() << "after filling sigmaSignal" <<Endl;

       sigmaSignal.Print();

       Log() << "after filling sigmaBack" <<Endl;

       sigmaBack.Print();

       Log() << "after filling total Sigma" <<Endl;

       fSigma->Print();

    }


    TDecompSVD solutionSVD = TDecompSVD( *fSigma );

    TMatrixF   decomposed  = TMatrixF( fNumParams, fNumParams );

    TMatrixF diag  ( fNumParams, fNumParams );

    TMatrixF uTrans( fNumParams, fNumParams );

    TMatrixF vTrans( fNumParams, fNumParams );

    if (solutionSVD.Decompose()) {

       for (UInt_t i = 0; i< fNumParams; ++i) {

          if (solutionSVD.GetSig()[i] > fTolerence)

             diag(i,i) = solutionSVD.GetSig()[i];

          else

             diag(i,i) = fTolerence;

       }


       if (fDebug) {

          Log() << "the diagonal" <<Endl;

          diag.Print();

       }


       decomposed = solutionSVD.GetV();

       decomposed *= diag;

       decomposed *= solutionSVD.GetU();


       if (fDebug) {

          Log() << "the decomposition " <<Endl;

          decomposed.Print();

       }


       *fSigmaInverse = uTrans.Transpose(solutionSVD.GetU());

       *fSigmaInverse /= diag;

       *fSigmaInverse *= vTrans.Transpose(solutionSVD.GetV());


       if (fDebug) {

          Log() << "the SigmaInverse " <<Endl;

          fSigmaInverse->Print();


          Log() << "the real " <<Endl;

          fSigma->Invert();

          fSigma->Print();


          Bool_t problem = false;

          for (UInt_t i =0; i< fNumParams; ++i) {

             for (UInt_t j =0; j< fNumParams; ++j) {

                if (TMath::Abs((Float_t)(*fSigma)(i,j) - (Float_t)(*fSigmaInverse)(i,j)) > 0.01) {

                   Log() << "problem, i= "<< i << " j= " << j << Endl;

                   Log() << "Sigma(i,j)= "<< (*fSigma)(i,j) << " SigmaInverse(i,j)= " << (*fSigmaInverse)(i,j) <<Endl;

                   Log() << "The difference is : " << TMath::Abs((Float_t)(*fSigma)(i,j) - (Float_t)(*fSigmaInverse)(i,j)) <<Endl;

                   problem = true;

                }

             }

          }

          if (problem) Log() << kWARNING << "Problem with the inversion!" << Endl;


       }

    }

 }


 ////////////////////////////////////////////////////////////////////////////////
 ///
 /// Probability value using Gaussian approximation
 ///
 /// \param x  point at which the density is evaluated; its first fNumParams
 ///           entries are read
 /// \param k  class index used to look up the mean in fMu
 /// \return   exp(-0.5 * d^T M d) / ((2*pi)^(n/2) * sqrt(det(fSigma))) with
 ///           d = x - fMu[k], M = *fSigmaInverse and n = fNumParams
 ///
 /// The normalisation used to be a fixed 1/(2*pi*sqrt(det)), which is the
 /// Gaussian prefactor for two parameters only; it now scales with the number
 /// of parameters and is unchanged for n = 2. Requires fSigma and fSigmaInverse
 /// to be non-null; neither pointer is checked here.

 Float_t TMVA::LDA::FSub(const std::vector<Float_t>& x, Int_t k)
 {
    const Float_t prefactor =
       1.0/(TMath::Power(TMath::TwoPi(), 0.5*fNumParams)*TMath::Sqrt(fSigma->Determinant()));

    // distance of x from the class mean, computed once and reused below
    const std::vector<Float_t>& mean = fMu[k];
    std::vector<Float_t> delta(fNumParams);
    for (UInt_t i=0; i < fNumParams; ++i) {
       delta[i] = x[i] - mean[i];
    }

    // quadratic form delta^T * SigmaInverse * delta, accumulated row by row
    Float_t exponent = 0.0;
    for (UInt_t j=0; j < fNumParams; ++j) {
       Float_t rowSum = 0;
       for (UInt_t i=0; i < fNumParams; ++i) {
          rowSum += delta[i] * (*fSigmaInverse)(j,i);
       }
       exponent += rowSum*delta[j];
    }

    exponent *= -0.5;

    return prefactor*TMath::Exp( exponent );
 }


 ////////////////////////////////////////////////////////////////////////////////
 ///
 /// Signal probability with Gaussian approximation
 ///
 /// \param x  point at which the probability is evaluated
 /// \param k  class whose probability is requested
 /// \return   FSub(x,k)*fEventFraction[k] divided by the sum of the same
 ///           product over classes 0 and 1
 ///
 /// The denominator is not checked against zero.

 Float_t TMVA::LDA::GetProb(const std::vector<Float_t>& x, Int_t k)
 {
    // weighted density of the requested class
    const Float_t classTerm = FSub(x,k)*fEventFraction[k];

    // weighted densities of both classes, summed
    const Float_t allTerms = FSub(x,0)*fEventFraction[0]+FSub(x,1)*fEventFraction[1];

    return classTerm/allTerms;
 }


 ////////////////////////////////////////////////////////////////////////////////
 ///
 /// Log likelihood function with Gaussian approximation
 ///
 /// \param x  point at which the ratio is evaluated
 /// \param k  class in the numerator; the denominator uses index !k, i.e. 1
 ///           when k is 0 and 0 for any non-zero k
 /// \return   log of the density ratio plus log of the event-fraction ratio

 Float_t TMVA::LDA::GetLogLikelihood( const std::vector<Float_t>& x, Int_t k )
 {
    const Float_t densityRatio  = FSub(x,k)/FSub(x,!k);
    const Float_t fractionRatio = fEventFraction[k]/fEventFraction[!k];

    return TMath::Log( densityRatio ) + TMath::Log( fractionRatio );
 }

TMVA::LDA::LDA
LDA(Float_t tolerence=1.0e-5, Bool_t debug=false)
constructor
Definition: LDA.cxx:52

TMVA::LDA::FSub
Float_t FSub(const std::vector< Float_t > &x, Int_t k)
Probability value using Gaussian approximation.
Definition: LDA.cxx:216

TDecompSVD::GetSig
const TVectorD & GetSig()
Definition: TDecompSVD.h:61

TMVA::Endl
MsgLogger & Endl(MsgLogger &ml)
Definition: MsgLogger.h:162

Types.h

TMatrixT::Transpose
TMatrixT< Element > & Transpose(const TMatrixT< Element > &source)
Transpose matrix source.
Definition: TMatrixT.cxx:1460

TMVA::LDA::~LDA
~LDA()
destructor
Definition: LDA.cxx:65

TMath::Log
Double_t Log(Double_t x)
Definition: TMath.h:526

Float_t
float Float_t
Definition: RtypesCore.h:53

TMatrixF
TMatrixT< Float_t > TMatrixF
Definition: TMatrixFfwd.h:24

Int_t
int Int_t
Definition: RtypesCore.h:41

Bool_t
bool Bool_t
Definition: RtypesCore.h:59

TMath::Abs
Short_t Abs(Short_t d)
Definition: TMathBase.h:110

TMatrixT
Definition: TMatrixDfwd.h:24

TDecompSVD
Definition: TDecompSVD.h:25

x
Double_t x[n]
Definition: legend1.C:17

TMVA::kDEBUG
Definition: Types.h:62

TMVA::LDA::GetProb
Float_t GetProb(const std::vector< Float_t > &x, Int_t k)
Signal probability with Gaussian approximation.
Definition: LDA.cxx:244

TMath::TwoPi
Double_t TwoPi()
Definition: TMath.h:45

TDecompSVD::GetU
const TMatrixD & GetU()
Definition: TDecompSVD.h:57

TDecompSVD::Decompose
virtual Bool_t Decompose()
SVD decomposition of matrix If the decomposition succeeds, bit kDecomposed is set ...
Definition: TDecompSVD.cxx:121

TObject::Print
virtual void Print(Option_t *option="") const
This method must be overridden when a class wants to print itself.
Definition: TObject.cxx:594

TMatrixTBase::Print
void Print(Option_t *name="") const
Print the matrix as a table of elements.
Definition: TMatrixTBase.cxx:815

TMVA::LDA::GetLogLikelihood
Float_t GetLogLikelihood(const std::vector< Float_t > &x, Int_t k)
Log likelihood function with Gaussian approximation.
Definition: LDA.cxx:257

UInt_t
unsigned int UInt_t
Definition: RtypesCore.h:42

TMath::K
Double_t K()
Definition: TMath.h:95

MsgLogger.h

TMVA::LDA::Initialize
void Initialize(const LDAEvents &inputSignal, const LDAEvents &inputBackground)
Create LDA matrix using local events found by knn method.
Definition: LDA.cxx:73

TMath::Exp
Double_t Exp(Double_t x)
Definition: TMath.h:495

LDA.h

TMVA::MsgLogger
Definition: MsgLogger.h:63

ROOT::Vc::AVX::Internal::exponent
Vc_INTRINSIC Vc_CONST m256 exponent(param256 v)
Definition: vectorhelper.h:37

LDAEvents
std::vector< std::vector< Float_t > > LDAEvents
Definition: LDA.h:42

TMatrixF.h

debug
bool debug
Definition: testSampleQuantiles.cxx:13

TDecompSVD::GetV
const TMatrixD & GetV()
Definition: TDecompSVD.h:59

TMath::Sqrt
Double_t Sqrt(Double_t x)
Definition: TMath.h:464

TMath.h

TMVA::kINFO
Definition: Types.h:64

TMVA::kWARNING
Definition: Types.h:65

Log
Definition: math.cpp:60

TDecompSVD.h