doc/v620/tmva_2tmva_2src_2Factory_8cxx_source.html

// @(#)Root/tmva $Id$

// Author: Andreas Hoecker, Peter Speckmayer, Joerg Stelzer, Helge Voss, Kai Voss, Eckhard von Toerne, Jan Therhaag

// Updated by: Omar Zapata, Kim Albertsson

/**********************************************************************************

 * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

 * Package: TMVA                                                                  *

 * Class  : Factory                                                               *

 * Web    : http://tmva.sourceforge.net                                           *

 *                                                                                *

 * Description:                                                                   *

 *      Implementation (see header for description)                               *

 *                                                                                *

 * Authors :                                                                      *

 *      Andreas Hoecker <Andreas.Hocker@cern.ch> - CERN, Switzerland              *

 *      Joerg Stelzer   <stelzer@cern.ch>        - DESY, Germany                  *

 *      Peter Speckmayer <peter.speckmayer@cern.ch> - CERN, Switzerland           *

 *      Jan Therhaag          <Jan.Therhaag@cern.ch>   - U of Bonn, Germany       *

 *      Eckhard v. Toerne     <evt@uni-bonn.de>        - U of Bonn, Germany       *

 *      Helge Voss      <Helge.Voss@cern.ch>     - MPI-K Heidelberg, Germany      *

 *      Kai Voss        <Kai.Voss@cern.ch>       - U. of Victoria, Canada         *

 *      Omar Zapata     <Omar.Zapata@cern.ch>    - UdeA/ITM Colombia              *

 *      Lorenzo Moneta  <Lorenzo.Moneta@cern.ch> - CERN, Switzerland              *

 *      Sergei Gleyzer  <Sergei.Gleyzer@cern.ch> - U of Florida & CERN            *

 *      Kim Albertsson  <kim.albertsson@cern.ch> - LTU & CERN                     *

 *                                                                                *

 * Copyright (c) 2005-2015:                                                       *

 *      CERN, Switzerland                                                         *

 *      U. of Victoria, Canada                                                    *

 *      MPI-K Heidelberg, Germany                                                 *

 *      U. of Bonn, Germany                                                       *

 *      UdeA/ITM, Colombia                                                        *

 *      U. of Florida, USA                                                        *

 *                                                                                *

 * Redistribution and use in source and binary forms, with or without             *

 * modification, are permitted according to the terms listed in LICENSE           *

 * (http://tmva.sourceforge.net/LICENSE)                                          *

 **********************************************************************************/


/*! \class TMVA::Factory

\ingroup TMVA


This is the main MVA steering class.

It creates all MVA methods, and guides them through the training, testing and

evaluation phases.

*/


#include "TMVA/Factory.h"


#include "TMVA/ClassifierFactory.h"

#include "TMVA/Config.h"

#include "TMVA/Configurable.h"

#include "TMVA/Tools.h"

#include "TMVA/Ranking.h"

#include "TMVA/DataSet.h"

#include "TMVA/IMethod.h"

#include "TMVA/MethodBase.h"

#include "TMVA/DataInputHandler.h"

#include "TMVA/DataSetManager.h"

#include "TMVA/DataSetInfo.h"

#include "TMVA/DataLoader.h"

#include "TMVA/MethodBoost.h"

#include "TMVA/MethodCategory.h"

#include "TMVA/ROCCalc.h"

#include "TMVA/ROCCurve.h"

#include "TMVA/MsgLogger.h"


#include "TMVA/VariableInfo.h"

#include "TMVA/VariableTransform.h"


#include "TMVA/Results.h"

#include "TMVA/ResultsClassification.h"

#include "TMVA/ResultsRegression.h"

#include "TMVA/ResultsMulticlass.h"

#include <list>

#include <bitset>


#include "TMVA/Types.h"


#include "TROOT.h"

#include "TFile.h"

#include "TTree.h"

#include "TLeaf.h"

#include "TEventList.h"

#include "TH2.h"

#include "TText.h"

#include "TLegend.h"

#include "TGraph.h"

#include "TStyle.h"

#include "TMatrixF.h"

#include "TMatrixDSym.h"

#include "TMultiGraph.h"

#include "TPaletteAxis.h"

#include "TPrincipal.h"

#include "TMath.h"

#include "TObjString.h"

#include "TSystem.h"

#include "TCanvas.h"


// Minimum number of training events a method's dataset must provide; methods
// with fewer events are skipped with a warning (see OptimizeAllMethods).
const Int_t  MinNoTrainingEvents = 10;

//const Int_t  MinNoTestEvents     = 1;


// ROOT ClassImp macro for TMVA::Factory.
ClassImp(TMVA::Factory);


// NOTE(review): READXML is not referenced in the visible part of this file;
// its consumers (if any) are further down - confirm before changing.
#define READXML          kTRUE


//number of bits for bitset
// NOTE(review): the bitset users are not visible in this part of the file.

#define VIBITS          32


////////////////////////////////////////////////////////////////////////////////

/// Standard constructor.

///

///  - jobname       : this name will appear in all weight file names produced by the MVAs

///  - theTargetFile : output ROOT file; the test tree and all evaluation plots

///                   will be stored here

///  - theOption     : option string; currently: "V" for verbose


TMVA::Factory::Factory( TString jobName, TFile* theTargetFile, TString theOption )
: Configurable          ( theOption ),
   fTransformations      ( "I" ),
   fVerbose              ( kFALSE ),
   fVerboseLevel         ( kINFO ),
   fCorrelations         ( kFALSE ),
   fROC                  ( kTRUE ),
   fSilentFile           ( theTargetFile == nullptr ),
   fJobName              ( jobName ),
   fAnalysisType         ( Types::kClassification ),
   fModelPersistence     (kTRUE)
{
   // Name the object (also used as logger source) and remember the output
   // file. A null target file puts the factory in "silent file" mode
   // (see the fSilentFile initialiser above).
   fName = "Factory";
   fgTargetFile = theTargetFile;
   fLogger->SetSource(fName.Data());

   // Make sure the logger is silent, if that was requested in the options.
   if (gTools().CheckForSilentOption( GetOptions() )) {
      Log().InhibitOutput();
   }

   // Configurable bookkeeping.
   SetConfigDescription( "Configuration options for Factory running" );
   SetConfigName( GetName() );

   // Unlike the overload without a target file, this constructor neither
   // calls TH1::AddDirectory(kFALSE) nor prints the greeting banner.

   // Defaults for options that are only forwarded to the global config.
   Bool_t silent          = kFALSE;
#ifdef WIN32
   // Progress bar and colour are off by default under Windows, since the
   // typical shell there does not handle the escape sequences.
   Bool_t color           = kFALSE;
   Bool_t drawProgressBar = kFALSE;
#else
   Bool_t color           = !gROOT->IsBatch();
   Bool_t drawProgressBar = kTRUE;
#endif

   // Option declarations. The AddPreDefVal calls presumably attach to the
   // option declared immediately before them, so the ordering is preserved.
   DeclareOptionRef( fVerbose, "V", "Verbose flag" );

   fVerboseLevel = TString("Info");
   DeclareOptionRef( fVerboseLevel, "VerboseLevel", "VerboseLevel (Debug/Verbose/Info)" );
   AddPreDefVal(TString("Debug"));
   AddPreDefVal(TString("Verbose"));
   AddPreDefVal(TString("Info"));

   DeclareOptionRef( color,    "Color", "Flag for coloured screen output (default: True, if in batch mode: False)" );
   DeclareOptionRef( fTransformations, "Transformations", "List of transformations to test; formatting example: \"Transformations=I;D;P;U;G,D\", for identity, decorrelation, PCA, Uniform and Gaussianisation followed by decorrelation transformations" );
   DeclareOptionRef( fCorrelations, "Correlations", "boolean to show correlation in output" );
   DeclareOptionRef( fROC, "ROC", "boolean to show ROC in output" );
   DeclareOptionRef( silent,   "Silent", "Batch mode: boolean silent flag inhibiting any output from TMVA after the creation of the factory class object (default: False)" );
   DeclareOptionRef( drawProgressBar,
                     "DrawProgressBar", "Draw progress bar to display training, testing and evaluation schedule (default: True)" );
   DeclareOptionRef( fModelPersistence,
                     "ModelPersistence",
                     "Option to save the trained model in xml file or using serialization");

   TString analysisType("Auto");
   DeclareOptionRef( analysisType,
                     "AnalysisType", "Set the analysis type (Classification, Regression, Multiclass, Auto) (default: Auto)" );
   AddPreDefVal(TString("Classification"));
   AddPreDefVal(TString("Regression"));
   AddPreDefVal(TString("Multiclass"));
   AddPreDefVal(TString("Auto"));

   ParseOptions();
   CheckForUnusedOptions();

   // Logger threshold. The level-based setting is applied after the "V"
   // flag, so whenever VerboseLevel matches one of the three names (its
   // default is "Info") it overrides the threshold chosen by "V".
   if (Verbose()) {
      fLogger->SetMinType( kVERBOSE );
   }
   if (fVerboseLevel == "Debug") {
      fLogger->SetMinType( kDEBUG );
   } else if (fVerboseLevel == "Verbose") {
      fLogger->SetMinType( kVERBOSE );
   } else if (fVerboseLevel == "Info") {
      fLogger->SetMinType( kINFO );
   }

   // Global settings.
   gConfig().SetUseColor( color );
   gConfig().SetSilent( silent );
   gConfig().SetDrawProgressBar( drawProgressBar );

   // Case-insensitive mapping of the requested analysis type. "auto" defers
   // the decision (kNoAnalysisType); any other unmatched string keeps the
   // initialiser-list default.
   analysisType.ToLower();
   if (analysisType == "classification") {
      fAnalysisType = Types::kClassification;
   } else if (analysisType == "regression") {
      fAnalysisType = Types::kRegression;
   } else if (analysisType == "multiclass") {
      fAnalysisType = Types::kMulticlass;
   } else if (analysisType == "auto") {
      fAnalysisType = Types::kNoAnalysisType;
   }
}


////////////////////////////////////////////////////////////////////////////////

/// Constructor.


TMVA::Factory::Factory( TString jobName, TString theOption )
: Configurable          ( theOption ),
   fTransformations      ( "I" ),
   fVerbose              ( kFALSE ),
   fCorrelations         ( kFALSE ),
   fROC                  ( kTRUE ),
   fSilentFile           ( kTRUE ),
   fJobName              ( jobName ),
   fAnalysisType         ( Types::kClassification ),
   fModelPersistence     (kTRUE)
{
   // No output file for this overload: the factory always runs in
   // "silent file" mode and the target file pointer is reset.
   fName = "Factory";
   fgTargetFile = nullptr;
   fLogger->SetSource(fName.Data());

   // Make sure the logger is silent, if that was requested in the options.
   if (gTools().CheckForSilentOption( GetOptions() )) {
      Log().InhibitOutput();
   }

   // Configurable bookkeeping.
   SetConfigDescription( "Configuration options for Factory running" );
   SetConfigName( GetName() );

   // Histograms are not automatically associated with the current
   // directory and hence don't go out of scope when closing the file.
   TH1::AddDirectory(kFALSE);

   // Defaults for options that are only forwarded to the global config.
   Bool_t silent          = kFALSE;
#ifdef WIN32
   // Progress bar and colour are off by default under Windows, since the
   // typical shell there does not handle the escape sequences.
   Bool_t color           = kFALSE;
   Bool_t drawProgressBar = kFALSE;
#else
   Bool_t color           = !gROOT->IsBatch();
   Bool_t drawProgressBar = kTRUE;
#endif

   // Option declarations. The AddPreDefVal calls presumably attach to the
   // option declared immediately before them, so the ordering is preserved.
   DeclareOptionRef( fVerbose, "V", "Verbose flag" );

   fVerboseLevel = TString("Info");
   DeclareOptionRef( fVerboseLevel, "VerboseLevel", "VerboseLevel (Debug/Verbose/Info)" );
   AddPreDefVal(TString("Debug"));
   AddPreDefVal(TString("Verbose"));
   AddPreDefVal(TString("Info"));

   DeclareOptionRef( color,    "Color", "Flag for coloured screen output (default: True, if in batch mode: False)" );
   DeclareOptionRef( fTransformations, "Transformations", "List of transformations to test; formatting example: \"Transformations=I;D;P;U;G,D\", for identity, decorrelation, PCA, Uniform and Gaussianisation followed by decorrelation transformations" );
   DeclareOptionRef( fCorrelations, "Correlations", "boolean to show correlation in output" );
   DeclareOptionRef( fROC, "ROC", "boolean to show ROC in output" );
   DeclareOptionRef( silent,   "Silent", "Batch mode: boolean silent flag inhibiting any output from TMVA after the creation of the factory class object (default: False)" );
   DeclareOptionRef( drawProgressBar,
                     "DrawProgressBar", "Draw progress bar to display training, testing and evaluation schedule (default: True)" );
   DeclareOptionRef( fModelPersistence,
                     "ModelPersistence",
                     "Option to save the trained model in xml file or using serialization");

   TString analysisType("Auto");
   DeclareOptionRef( analysisType,
                     "AnalysisType", "Set the analysis type (Classification, Regression, Multiclass, Auto) (default: Auto)" );
   AddPreDefVal(TString("Classification"));
   AddPreDefVal(TString("Regression"));
   AddPreDefVal(TString("Multiclass"));
   AddPreDefVal(TString("Auto"));

   ParseOptions();
   CheckForUnusedOptions();

   // Logger threshold. The level-based setting is applied after the "V"
   // flag, so whenever VerboseLevel matches one of the three names (its
   // default is "Info") it overrides the threshold chosen by "V".
   if (Verbose()) {
      fLogger->SetMinType( kVERBOSE );
   }
   if (fVerboseLevel == "Debug") {
      fLogger->SetMinType( kDEBUG );
   } else if (fVerboseLevel == "Verbose") {
      fLogger->SetMinType( kVERBOSE );
   } else if (fVerboseLevel == "Info") {
      fLogger->SetMinType( kINFO );
   }

   // Global settings.
   gConfig().SetUseColor( color );
   gConfig().SetSilent( silent );
   gConfig().SetDrawProgressBar( drawProgressBar );

   // Case-insensitive mapping of the requested analysis type. "auto" defers
   // the decision (kNoAnalysisType); any other unmatched string keeps the
   // initialiser-list default.
   analysisType.ToLower();
   if (analysisType == "classification") {
      fAnalysisType = Types::kClassification;
   } else if (analysisType == "regression") {
      fAnalysisType = Types::kRegression;
   } else if (analysisType == "multiclass") {
      fAnalysisType = Types::kMulticlass;
   } else if (analysisType == "auto") {
      fAnalysisType = Types::kNoAnalysisType;
   }

   // Print the welcome banner (only this overload does so).
   Greetings();
}


////////////////////////////////////////////////////////////////////////////////

/// Print welcome message.

/// Options are: kLogoWelcomeMsg, kIsometricWelcomeMsg, kLeanWelcomeMsg


void TMVA::Factory::Greetings()

{

   gTools().ROOTVersionMessage( Log() );

   gTools().TMVAWelcomeMessage( Log(), gTools().kLogoWelcomeMsg );

   gTools().TMVAVersionMessage( Log() ); Log() << Endl;

}


////////////////////////////////////////////////////////////////////////////////

/// Destructor.


TMVA::Factory::~Factory( void )
{
   // Release the default variable transformations held by this factory.
   for (auto *defaultTrf : fDefaultTrfs) {
      delete defaultTrf;
   }

   // Release every booked method together with the per-dataset vectors.
   this->DeleteAllMethods();

   // The singleton instances are deliberately left alone here
   // (problem with call of REGISTER_METHOD macro ...):
   //   ClassifierFactory::DestroyInstance();
   //   Types::DestroyInstance();
   //   Tools::DestroyInstance();
   //   Config::DestroyInstance();
}


////////////////////////////////////////////////////////////////////////////////

/// Delete methods.


void TMVA::Factory::DeleteAllMethods( void )
{
   // Deletes every booked method and the per-dataset vector that holds it,
   // then empties the dataset -> methods map.
   for (auto &datasetEntry : fMethodsMap) {
      MVector *methods = datasetEntry.second;
      if (methods == nullptr) continue; // nothing booked under this name

      for (auto *method : *methods) {
         Log() << kDEBUG << "Delete method: " << method->GetName() << Endl;
         delete method;
      }
      delete methods;
   }

   // Drop the now-dangling vector pointers. Without this, a second call
   // (e.g. an explicit call followed by the destructor) would iterate over
   // and delete already freed memory.
   fMethodsMap.clear();
}


////////////////////////////////////////////////////////////////////////////////


/// Set the verbose flag.
///
/// Only the stored flag is updated; the logger threshold is not touched here.

void TMVA::Factory::SetVerbose( Bool_t v )
{
   this->fVerbose = v;
}


////////////////////////////////////////////////////////////////////////////////

/// Book a classifier or regression method.


TMVA::MethodBase* TMVA::Factory::BookMethod( TMVA::DataLoader *loader, TString theMethodName, TString methodTitle, TString theOption )
{
   // Books the method named `theMethodName` under the title `methodTitle`
   // for the dataset of `loader`, configured through `theOption`.
   //
   // Returns the booked method, or a null pointer when the created object is
   // not a MethodBase, a required cast fails, or the method cannot handle the
   // current analysis type. Booking a title that already exists for the same
   // dataset is reported with kFATAL.

   // Directory for the DataLoader output (only needed when models are persisted).
   if (fModelPersistence) gSystem->MakeDirectory(loader->GetName());

   const TString datasetname = loader->GetName();
   DataSetInfo &dsi = loader->GetDataSetInfo();

   // "Auto" analysis type: decide from the classes known to the dataset.
   if (fAnalysisType == Types::kNoAnalysisType) {
      const Bool_t isSignalVsBackground = dsi.GetNClasses() == 2
                                          && dsi.GetClassInfo("Signal") != nullptr
                                          && dsi.GetClassInfo("Background") != nullptr;
      if (isSignalVsBackground) {
         fAnalysisType = Types::kClassification; // default is classification
      } else if (dsi.GetNClasses() >= 2) {
         fAnalysisType = Types::kMulticlass;     // if two classes, but not named "Signal" and "Background"
      } else {
         Log() << kFATAL << "No analysis type for " << dsi.GetNClasses() << " classes and "
               << dsi.GetNTargets() << " regression targets." << Endl;
      }
   }

   // A title may be booked only once per dataset. GetMethod() returns null
   // for an unknown dataset, so no separate map lookup is needed first.
   if (GetMethod( datasetname, methodTitle ) != nullptr) {
      Log() << kFATAL << "Booking failed since method with title <"
            << methodTitle <<"> already exists "<< "in with DataSet Name <"<< loader->GetName()<<">  "
            << Endl;
   }

   Log() << kHEADER << "Booking method: " << gTools().Color("bold") << methodTitle
         << gTools().Color("reset") << Endl << Endl;

   // Interpret the option string with respect to a request for boosting
   // (i.e., Boost_num > 0). The helper lives on the stack so that it is
   // released even if option parsing raises an error.
   Int_t boostNum = 0;
   {
      TMVA::Configurable boostOptions( theOption );
      boostOptions.DeclareOptionRef( boostNum = 0, "Boost_num",
                                     "Number of times the classifier will be boosted" );
      boostOptions.ParseOptions();
   }

   // Name of the weight file directory: [prefix/]<dataset name>/<weight dir>.
   TString fileDir;
   if (fModelPersistence) {
      TString prefix = gConfig().GetIONames().fWeightFileDirPrefix;
      fileDir = prefix;
      if (!prefix.IsNull())
         if (fileDir[fileDir.Length()-1] != '/') fileDir += "/";
      fileDir += loader->GetName();
      fileDir += "/" + gConfig().GetIONames().fWeightFileDir;
   }

   // Create the method object.
   IMethod* im = nullptr;
   if (!boostNum) {
      im = ClassifierFactory::Instance().Create(theMethodName.Data(), fJobName, methodTitle,
                                                dsi, theOption);
   }
   else {
      // Boosted classifier: requires a specific definition, made transparent for the user.
      Log() << kDEBUG <<"Boost Number is " << boostNum << " > 0: train boosted classifier" << Endl;
      im = ClassifierFactory::Instance().Create("Boost", fJobName, methodTitle, dsi, theOption);
      MethodBoost *methBoost = dynamic_cast<MethodBoost *>(im);
      if (!methBoost) {
         Log() << kFATAL << "Method with type kBoost cannot be casted to MethodBoost. /Factory" << Endl;
         return nullptr;
      }
      if (fModelPersistence) methBoost->SetWeightFileDir(fileDir);
      methBoost->SetModelPersistence(fModelPersistence);
      methBoost->SetBoostedMethodName(theMethodName);
      methBoost->fDataSetManager = dsi.GetDataSetManager();
      methBoost->SetFile(fgTargetFile);
      methBoost->SetSilentFile(IsSilentFile());
   }

   MethodBase *method = dynamic_cast<MethodBase*>(im);
   if (method == nullptr) return nullptr; // could not create method

   // Category methods need the dataset manager (to enable Category to
   // create datasetinfo objects).
   if (method->GetMethodType() == Types::kCategory) {
      MethodCategory *methCat = dynamic_cast<MethodCategory*>(im);
      if (!methCat) {
         Log() << kFATAL << "Method with type kCategory cannot be casted to MethodCategory. /Factory" << Endl;
         return nullptr;
      }
      if (fModelPersistence) methCat->SetWeightFileDir(fileDir);
      methCat->SetModelPersistence(fModelPersistence);
      methCat->fDataSetManager = dsi.GetDataSetManager();
      methCat->SetFile(fgTargetFile);
      methCat->SetSilentFile(IsSilentFile());
   }

   if (!method->HasAnalysisType( fAnalysisType, dsi.GetNClasses(), dsi.GetNTargets() )) {
      Log() << kWARNING << "Method " << method->GetMethodTypeName() << " is not capable of handling " ;
      if (fAnalysisType == Types::kRegression) {
         Log() << "regression with " << dsi.GetNTargets() << " targets." << Endl;
      }
      else if (fAnalysisType == Types::kMulticlass ) {
         Log() << "multiclass classification with " << dsi.GetNClasses() << " classes." << Endl;
      }
      else {
         Log() << "classification with " << dsi.GetNClasses() << " classes." << Endl;
      }
      // NOTE(review): the created method is neither registered nor deleted on
      // this path; whether it is safe to delete before SetupMethod() depends
      // on the MethodBase destructor - confirm before adding a delete.
      return nullptr;
   }

   // Configure the method. The call order below is kept exactly as before.
   if (fModelPersistence) method->SetWeightFileDir(fileDir);
   method->SetModelPersistence(fModelPersistence);
   method->SetAnalysisType( fAnalysisType );
   method->SetupMethod();
   method->ParseOptions();
   method->ProcessSetup();
   method->SetFile(fgTargetFile);
   method->SetSilentFile(IsSilentFile());

   // check-for-unused-options is performed; may be overridden by derived classes
   method->CheckSetup();

   // Register under the dataset name, creating the vector on first use.
   MVector *&bookedMethods = fMethodsMap[datasetname];
   if (bookedMethods == nullptr) bookedMethods = new MVector;
   bookedMethods->push_back( method );

   return method;
}


////////////////////////////////////////////////////////////////////////////////

/// Books MVA method. The option configuration string is custom for each MVA

/// method; the TString field "methodTitle" serves to define (and distinguish)

/// several instances of a given MVA, eg, when one wants to compare the

/// performance of various configurations


TMVA::MethodBase* TMVA::Factory::BookMethod(TMVA::DataLoader *loader, Types::EMVA theMethod, TString methodTitle, TString theOption )
{
   // Translate the enum into the method name and forward to the
   // name-based overload, which does the actual booking.
   const TString methodName = Types::Instance().GetMethodName( theMethod );
   return BookMethod(loader, methodName, methodTitle, theOption );
}


////////////////////////////////////////////////////////////////////////////////

/// Adds an already constructed method to be managed by this factory.

///

/// \note Private.

/// \note Know what you are doing when using this method. The method that you

/// are loading could be trained already.

///


TMVA::MethodBase* TMVA::Factory::BookMethodWeightfile(DataLoader *loader, TMVA::Types::EMVA methodType, const TString &weightfile)
{
   // Creates a method of type `methodType` from `weightfile`, reads its state
   // from file and registers it under the dataset name of `loader`.
   //
   // Returns the booked method, or nullptr if the created object is not a
   // MethodBase. A title that is already booked for the dataset is reported
   // with kFATAL.
   TString datasetname = loader->GetName();
   std::string methodTypeName = std::string(Types::Instance().GetMethodName(methodType).Data());
   DataSetInfo &dsi = loader->GetDataSetInfo();

   IMethod *im = ClassifierFactory::Instance().Create(methodTypeName, dsi, weightfile );
   MethodBase *method = dynamic_cast<MethodBase*>(im);
   if (method == nullptr) return nullptr;

   // Category methods are only reported; processing continues afterwards.
   if (method->GetMethodType() == Types::kCategory) {
      Log() << kERROR << "Cannot handle category methods for now." << Endl;
   }

   // Name of the weight file directory: [prefix/]<dataset name>/<weight dir>.
   TString fileDir;
   if (fModelPersistence) {
      TString prefix = gConfig().GetIONames().fWeightFileDirPrefix;
      fileDir = prefix;
      if (!prefix.IsNull())
         if (fileDir[fileDir.Length() - 1] != '/')
            fileDir += "/";
      // Append (not assign) the dataset name: assigning here discarded the
      // prefix computed above, unlike the directory built in BookMethod().
      fileDir += loader->GetName();
      fileDir += "/" + gConfig().GetIONames().fWeightFileDir;
   }

   if (fModelPersistence) method->SetWeightFileDir(fileDir);
   method->SetModelPersistence(fModelPersistence);
   method->SetAnalysisType( fAnalysisType );
   method->SetupMethod();
   method->SetFile(fgTargetFile);
   method->SetSilentFile(IsSilentFile());

   method->DeclareCompatibilityOptions();

   // read weight file
   method->ReadStateFromFile();

   //method->CheckSetup();

   // The title is only known after the state has been read, so the
   // duplicate check has to come after ReadStateFromFile().
   TString methodTitle = method->GetName();
   if (HasMethod(datasetname, methodTitle)) {
      Log() << kFATAL << "Booking failed since method with title <"
            << methodTitle <<"> already exists "<< "in with DataSet Name <"<< loader->GetName()<<">  "
            << Endl;
   }

   Log() << kINFO << "Booked classifier \"" << method->GetMethodName()
         << "\" of type: \"" << method->GetMethodTypeName() << "\"" << Endl;

   // Register under the dataset name, creating the vector on first use.
   MVector *&bookedMethods = fMethodsMap[datasetname];
   if (bookedMethods == nullptr) bookedMethods = new MVector;
   bookedMethods->push_back( method );

   return method;
}


////////////////////////////////////////////////////////////////////////////////

/// Returns pointer to MVA that corresponds to given method title.


TMVA::IMethod* TMVA::Factory::GetMethod(const TString& datasetname,  const TString &methodTitle ) const
{
   // Looks up the method whose GetMethodName() equals `methodTitle` among the
   // methods booked for `datasetname`. Returns nullptr when the dataset is
   // unknown or no booked method matches.
   const auto datasetEntry = fMethodsMap.find(datasetname);
   if (datasetEntry == fMethodsMap.end() || datasetEntry->second == nullptr) return nullptr;

   for (auto *candidate : *datasetEntry->second) {
      MethodBase *mva = dynamic_cast<MethodBase*>(candidate);
      // Entries that are not MethodBase objects are skipped instead of
      // being dereferenced through a null pointer.
      if (mva != nullptr && mva->GetMethodName() == methodTitle) return mva;
   }
   return nullptr;
}


////////////////////////////////////////////////////////////////////////////////

/// Checks whether a given method name is defined for a given dataset.


Bool_t TMVA::Factory::HasMethod(const TString& datasetname,  const TString &methodTitle ) const
{
   // Unknown dataset: nothing can be booked under it.
   const auto datasetEntry = this->fMethodsMap.find(datasetname);
   if (datasetEntry == this->fMethodsMap.end()) return kFALSE;

   // Note: the comparison uses IMethod::GetName(), whereas GetMethod()
   // matches on MethodBase::GetMethodName().
   const std::string wantedName = methodTitle.Data();
   const TMVA::Factory::MVector *bookedMethods = datasetEntry->second;
   for (TMVA::IMethod *booked : *bookedMethods) {
      if (wantedName.compare( booked->GetName() ) == 0) return kTRUE;
   }
   return kFALSE;
}


////////////////////////////////////////////////////////////////////////////////


/// Writes the correlation-matrix histograms of the given dataset into a
/// directory named after it below RootBaseDir(), then runs the configured
/// variable transformations with that directory as their root dir.
/// Does nothing if the directory already exists.

void TMVA::Factory::WriteDataInformation(DataSetInfo&     fDataSetInfo)
{
   RootBaseDir()->cd();

   // The loader is already in the output file; no need to save it again.
   if (RootBaseDir()->GetDirectory(fDataSetInfo.GetName())) return;
   RootBaseDir()->mkdir(fDataSetInfo.GetName());

   RootBaseDir()->cd(fDataSetInfo.GetName());
   fDataSetInfo.GetDataSet(); // builds dataset (including calculation of correlation matrix)

   // Writes a correlation histogram (if one was created) and releases it.
   auto writeAndRelease = [](const TH2 *hist) {
      if (hist == 0) return;
      hist->Write();
      delete hist;
   };

   // Correlation matrices of the default dataset.
   if (fAnalysisType == Types::kMulticlass) {
      // One histogram per class, named after the class.
      for (UInt_t cls = 0; cls < fDataSetInfo.GetNClasses() ; cls++) {
         const TMatrixD *matrix = fDataSetInfo.CorrelationMatrix(fDataSetInfo.GetClassInfo(cls)->GetName());
         const TH2 *hist = fDataSetInfo.CreateCorrelationMatrixHist(
            matrix,
            TString("CorrelationMatrix")+fDataSetInfo.GetClassInfo(cls)->GetName(),
            TString("Correlation Matrix (")+ fDataSetInfo.GetClassInfo(cls)->GetName() +TString(")"));
         writeAndRelease(hist);
      }
   }
   else {
      // Fixed set of { class name, histogram name, histogram title }.
      const char *const fixedMatrices[3][3] = {
         { "Signal",     "CorrelationMatrixS", "Correlation Matrix (signal)" },
         { "Background", "CorrelationMatrixB", "Correlation Matrix (background)" },
         { "Regression", "CorrelationMatrix",  "Correlation Matrix" }
      };
      for (const auto &spec : fixedMatrices) {
         const TMatrixD *matrix = fDataSetInfo.CorrelationMatrix( spec[0] );
         const TH2 *hist = fDataSetInfo.CreateCorrelationMatrixHist(matrix, spec[1], spec[2]);
         writeAndRelease(hist);
      }
   }

   // Transformations to evaluate: the user-defined list (";"-separated).
   // NOTE: all transformations are destroyed after this test.
   TString processTrfs = fTransformations;

   std::vector<TMVA::TransformationHandler*> handlers;
   TransformationHandler* identityTrHandler = 0;

   // One handler per transformation definition. The last definition that
   // begins with 'I' is remembered for the variable ranking printout.
   std::vector<TString> trfsDef = gTools().SplitString(processTrfs,';');
   for (TString trfS : trfsDef) {
      TMVA::TransformationHandler *handler = new TMVA::TransformationHandler(fDataSetInfo, "Factory");
      handlers.push_back(handler);

      Log() << kDEBUG << "current transformation string: '" << trfS.Data() << "'" << Endl;
      TMVA::CreateVariableTransforms( trfS, fDataSetInfo, *handler, Log() );

      if (trfS.BeginsWith('I')) identityTrHandler = handler;
   }

   const std::vector<Event*>& inputEvents = fDataSetInfo.GetDataSet()->GetEventCollection();

   // Apply all transformations.
   for (TMVA::TransformationHandler *handler : handlers) {
      // Setting a root dir causes the variable distributions to be saved to
      // the root file; every dataloader has its own directory.
      handler->SetRootDir(RootBaseDir()->GetDirectory(fDataSetInfo.GetName()));
      handler->CalcTransformations(inputEvents);
   }
   if (identityTrHandler) identityTrHandler->PrintVariableRanking();

   // Clean up.
   for (TMVA::TransformationHandler *handler : handlers) delete handler;
}


////////////////////////////////////////////////////////////////////////////////

/// Iterates through all booked methods and sees if they use parameter tuning and if so..

/// does just that  i.e. calls "Method::Train()" for different parameter settings and

/// keeps in mind the "optimal one"... and that's the one that will later on be used

/// in the main training loop.


std::map<TString,Double_t> TMVA::Factory::OptimizeAllMethods(TString fomType, TString fitType)
{
   // The returned map is overwritten by every optimised method, so it holds
   // the tuned parameters of the last method that was optimised.
   std::map<TString,Double_t> TunedParameters;

   for (auto &datasetEntry : fMethodsMap) {
      MVector *bookedMethods = datasetEntry.second;

      // Iterate over the methods of this dataset and optimise each one.
      for (auto *booked : *bookedMethods) {
         Event::SetIsTraining(kTRUE);

         MethodBase* mva = dynamic_cast<MethodBase*>(booked);
         if (!mva) {
            Log() << kFATAL << "Dynamic cast to MethodBase failed" <<Endl;
            return TunedParameters;
         }

         // Skip methods whose dataset has too few training events.
         if (mva->Data()->GetNTrainingEvents() < MinNoTrainingEvents) {
            Log() << kWARNING << "Method " << mva->GetMethodName()
                  << " not trained (training tree has less entries ["
                  << mva->Data()->GetNTrainingEvents()
                  << "] than required [" << MinNoTrainingEvents << "]" << Endl;
            continue;
         }

         // Human-readable label of the current analysis type.
         const char *analysisLabel = "Classification";
         if (fAnalysisType == Types::kRegression) {
            analysisLabel = "Regression";
         } else if (fAnalysisType == Types::kMulticlass) {
            analysisLabel = "Multiclass classification";
         }
         Log() << kINFO << "Optimize method: " << mva->GetMethodName() << " for "
               << analysisLabel << Endl;

         TunedParameters = mva->OptimizeTuningParameters(fomType,fitType);
         Log() << kINFO << "Optimization of tuning parameters finished for Method:"<<mva->GetName() << Endl;
      }
   }

   return TunedParameters;
}


////////////////////////////////////////////////////////////////////////////////

/// Private method to generate a ROCCurve instance for a given method.

/// Handles the conversion from TMVA ResultSet to a format the ROCCurve class

/// understands.

///

/// \note You own the returned pointer.

///


TMVA::ROCCurve *TMVA::Factory::GetROC(TMVA::DataLoader *loader, TString theMethodName, UInt_t iClass,
                                      Types::ETreeType type)
{
   // Resolve the loader to its dataset name and delegate to the
   // name-based overload.
   const TString datasetname(loader->GetName());
   return GetROC(datasetname, theMethodName, iClass, type);
}


////////////////////////////////////////////////////////////////////////////////
/// Private method to generate a ROCCurve instance for a given method.
/// Converts the results stored for the method into the three vectors (MVA
/// values, signal flags, event weights) handed to the ROCCurve constructor.
///
/// - kClassification: values and flags are taken from the
///   ResultsClassification object; weights come from the event collection.
/// - kMulticlass: the response for class `iClass` is extracted from every
///   event's response vector and an event counts as signal when its class
///   equals `iClass` (one-vs-rest).
///
/// \param[in] datasetname   Name of the dataset (key into the methods map).
/// \param[in] theMethodName Name of the booked method.
/// \param[in] iClass        Class treated as signal; only range-checked and used
///                          for kMulticlass.
/// \param[in] type          Tree type whose events/results are used.
/// \return A newly allocated ROCCurve, or nullptr (after logging a kERROR) when
///         the dataset or method is unknown, the analysis type is neither
///         kClassification nor kMulticlass, `iClass` is out of range, or the
///         method/results objects do not have the expected dynamic type.
///
/// \note You own the returned pointer.
/// \note Side effect: the current tree type of the method's dataset is set to
///       `type`.
///

TMVA::ROCCurve *TMVA::Factory::GetROC(TString datasetname, TString theMethodName, UInt_t iClass, Types::ETreeType type)
{
   if (fMethodsMap.find(datasetname) == fMethodsMap.end()) {
      Log() << kERROR << Form("DataSet = %s not found in methods map.", datasetname.Data()) << Endl;
      return nullptr;
   }

   if (!this->HasMethod(datasetname, theMethodName)) {
      Log() << kERROR << Form("Method = %s not found with Dataset = %s ", theMethodName.Data(), datasetname.Data())
            << Endl;
      return nullptr;
   }

   if (this->fAnalysisType != Types::kClassification && this->fAnalysisType != Types::kMulticlass) {
      Log() << kERROR << Form("Can only generate ROC curves for analysis type kClassification and kMulticlass.")
            << Endl;
      return nullptr;
   }

   // The cast can fail if the booked object is not a MethodBase; bail out
   // instead of dereferencing a null pointer.
   TMVA::MethodBase *method = dynamic_cast<TMVA::MethodBase *>(this->GetMethod(datasetname, theMethodName));
   if (method == nullptr) {
      Log() << kERROR
            << Form("Method = %s with Dataset = %s is not a MethodBase.", theMethodName.Data(), datasetname.Data())
            << Endl;
      return nullptr;
   }

   TMVA::DataSet *dataset = method->Data();
   dataset->SetCurrentType(type);
   TMVA::Results *results = dataset->GetResults(theMethodName, type, this->fAnalysisType);

   const UInt_t nClasses = method->DataInfo().GetNClasses();
   if (this->fAnalysisType == Types::kMulticlass && iClass >= nClasses) {
      // %u: both values are unsigned.
      Log() << kERROR << Form("Given class number (iClass = %u) does not exist. There are %u classes in dataset.",
                              iClass, nClasses)
            << Endl;
      return nullptr;
   }

   // Bind by const reference so the event-pointer vector is not copied.
   const auto &eventCollection = dataset->GetEventCollection(type);

   std::vector<Float_t> mvaResWeights;
   mvaResWeights.reserve(eventCollection.size());

   if (this->fAnalysisType == Types::kClassification) {

      ResultsClassification *clsResults = dynamic_cast<ResultsClassification *>(results);
      if (clsResults == nullptr) {
         Log() << kERROR
               << Form("Results of Method = %s are not classification results.", theMethodName.Data()) << Endl;
         return nullptr;
      }

      std::vector<Float_t> *mvaRes = clsResults->GetValueVector();
      std::vector<Bool_t> *mvaResTypes = clsResults->GetValueVectorTypes();

      for (const auto *ev : eventCollection) {
         mvaResWeights.push_back(ev->GetWeight());
      }

      return new TMVA::ROCCurve(*mvaRes, *mvaResTypes, mvaResWeights);
   }

   // Only kMulticlass can reach this point (see the analysis type check above).
   ResultsMulticlass *mcResults = dynamic_cast<ResultsMulticlass *>(results);
   if (mcResults == nullptr) {
      Log() << kERROR << Form("Results of Method = %s are not multiclass results.", theMethodName.Data()) << Endl;
      return nullptr;
   }

   std::vector<std::vector<Float_t>> *rawMvaRes = mcResults->GetValueVector();

   // Vector transpose due to values being stored as
   //    [ [0, 1, 2], [0, 1, 2], ... ]
   // in ResultsMulticlass::GetValueVector.
   std::vector<Float_t> mvaRes;
   mvaRes.reserve(rawMvaRes->size());
   for (const auto &item : *rawMvaRes) { // const&: avoid copying every per-event vector
      mvaRes.push_back(item[iClass]);
   }

   std::vector<Bool_t> mvaResTypes;
   mvaResTypes.reserve(eventCollection.size());
   for (const auto *ev : eventCollection) {
      mvaResTypes.push_back(ev->GetClass() == iClass);
      mvaResWeights.push_back(ev->GetWeight());
   }

   return new TMVA::ROCCurve(mvaRes, mvaResTypes, mvaResWeights);
}


////////////////////////////////////////////////////////////////////////////////
/// Calculate the integral of the ROC curve, also known as the area under curve
/// (AUC), for a given method. Convenience overload that takes the dataset as a
/// DataLoader and forwards to the name-based overload using the loader's name.
///
/// Argument iClass specifies the class to generate the ROC curve in a
/// multiclass setting. It is ignored for binary classification.
///
/// \param[in] loader        DataLoader whose name identifies the dataset. It is
///                          dereferenced without a null check.
/// \param[in] theMethodName Name of the booked method.
/// \param[in] iClass        Class index, forwarded as is.
/// \return Whatever the name-based overload returns.
///

Double_t TMVA::Factory::GetROCIntegral(TMVA::DataLoader *loader, TString theMethodName, UInt_t iClass)
{
   const TString datasetName(loader->GetName());
   return GetROCIntegral(datasetName, theMethodName, iClass);
}


////////////////////////////////////////////////////////////////////////////////
/// Calculate the integral of the ROC curve, also known as the area under curve
/// (AUC), for a given method.
///
/// Argument iClass specifies the class to generate the ROC curve in a
/// multiclass setting. It is ignored for binary classification.
///
/// The curve is obtained from GetROC and integrated with
/// `fNbinsXOfROCCurve + 1` points (value read from the global TMVA config).
///
/// \param[in] datasetname   Name of the dataset (key into the methods map).
/// \param[in] theMethodName Name of the booked method.
/// \param[in] iClass        Class treated as signal in the multiclass case.
/// \return The ROC integral, or 0 after logging when the dataset or method is
///         unknown, the analysis type is neither kClassification nor
///         kMulticlass, or no ROCCurve could be created (logged as kFATAL).
///

Double_t TMVA::Factory::GetROCIntegral(TString datasetname, TString theMethodName, UInt_t iClass)
{
   if (fMethodsMap.find(datasetname) == fMethodsMap.end()) {
      Log() << kERROR << Form("DataSet = %s not found in methods map.", datasetname.Data()) << Endl;
      return 0;
   }

   if (!this->HasMethod(datasetname, theMethodName)) {
      Log() << kERROR << Form("Method = %s not found with Dataset = %s ", theMethodName.Data(), datasetname.Data())
            << Endl;
      return 0;
   }

   if (this->fAnalysisType != Types::kClassification && this->fAnalysisType != Types::kMulticlass) {
      Log() << kERROR << Form("Can only generate ROC integral for analysis type kClassification and kMulticlass.")
            << Endl;
      return 0;
   }

   TMVA::ROCCurve *rocCurve = GetROC(datasetname, theMethodName, iClass);
   if (!rocCurve) {
      Log() << kFATAL << Form("ROCCurve object was not created for Method = %s with Dataset = %s ",
                              theMethodName.Data(), datasetname.Data())
            << Endl;
      return 0;
   }

   const Int_t npoints = TMVA::gConfig().fVariablePlotting.fNbinsXOfROCCurve + 1;
   const Double_t rocIntegral = rocCurve->GetROCIntegral(npoints);

   // GetROC hands over ownership of the curve; release it once integrated.
   delete rocCurve;

   return rocIntegral;
}


////////////////////////////////////////////////////////////////////////////////
/// Convenience overload that takes the dataset as a DataLoader and forwards to
/// the name-based overload using the loader's name.
///
/// Argument iClass specifies the class to generate the ROC curve in a
/// multiclass setting. It is ignored for binary classification.
///
/// Returns a ROC graph for a given method, or nullptr on error.
///
/// Note: Evaluation of the given method must have been run prior to ROC
/// generation through Factory::EvaluateAllMethods.
///
/// NOTE: The ROC curve is 1 vs. all where the given class is considered signal
/// and the others considered background. This is ok in binary classification
/// but in multi class classification, the ROC surface is an N dimensional
/// shape, where N is number of classes - 1.
///
/// \param[in] loader        DataLoader whose name identifies the dataset. It is
///                          dereferenced without a null check.
/// \param[in] theMethodName Name of the booked method.
/// \param[in] setTitles     Forwarded as is.
/// \param[in] iClass        Forwarded as is.

TGraph* TMVA::Factory::GetROCCurve(DataLoader *loader, TString theMethodName, Bool_t setTitles, UInt_t iClass)
{
   const TString datasetName(loader->GetName());
   return GetROCCurve(datasetName, theMethodName, setTitles, iClass);
}


////////////////////////////////////////////////////////////////////////////////
/// Argument iClass specifies the class to generate the ROC curve in a
/// multiclass setting. It is ignored for binary classification.
///
/// Returns a ROC graph for a given method, or nullptr on error.
///
/// Note: Evaluation of the given method must have been run prior to ROC
/// generation through Factory::EvaluateAllMethods.
///
/// NOTE: The ROC curve is 1 vs. all where the given class is considered signal
/// and the others considered background. This is ok in binary classification
/// but in multi class classification, the ROC surface is an N dimensional
/// shape, where N is number of classes - 1.
///
/// \param[in] datasetname   Name of the dataset (key into the methods map).
/// \param[in] theMethodName Name of the booked method.
/// \param[in] setTitles     When true, axis titles and a graph title containing
///                          the method name are set on the returned graph.
/// \param[in] iClass        Class treated as signal in the multiclass case.
/// \return A clone of the graph produced by the ROCCurve object, or nullptr
///         after logging when the dataset or method is unknown, the analysis
///         type is neither kClassification nor kMulticlass, or no ROCCurve
///         could be created (logged as kFATAL).

TGraph* TMVA::Factory::GetROCCurve(TString datasetname, TString theMethodName, Bool_t setTitles, UInt_t iClass)
{
   if (fMethodsMap.find(datasetname) == fMethodsMap.end()) {
      Log() << kERROR << Form("DataSet = %s not found in methods map.", datasetname.Data()) << Endl;
      return nullptr;
   }

   if (!this->HasMethod(datasetname, theMethodName)) {
      Log() << kERROR << Form("Method = %s not found with Dataset = %s ", theMethodName.Data(), datasetname.Data())
            << Endl;
      return nullptr;
   }

   if (this->fAnalysisType != Types::kClassification && this->fAnalysisType != Types::kMulticlass) {
      Log() << kERROR << Form("Can only generate ROC curves for analysis type kClassification and kMulticlass.")
            << Endl;
      return nullptr;
   }

   TMVA::ROCCurve *rocCurve = GetROC(datasetname, theMethodName, iClass);
   if (!rocCurve) {
      Log() << kFATAL << Form("ROCCurve object was not created for Method = %s with Dataset = %s ",
                              theMethodName.Data(), datasetname.Data())
            << Endl;
      return nullptr;
   }

   // Work on a clone because the ROCCurve is deleted right below
   // (presumably it owns the graph it hands out - TODO confirm).
   TGraph *graph = static_cast<TGraph *>(rocCurve->GetROCCurve()->Clone());
   delete rocCurve;

   if (setTitles) {
      graph->GetYaxis()->SetTitle("Background rejection (Specificity)");
      graph->GetXaxis()->SetTitle("Signal efficiency (Sensitivity)");
      graph->SetTitle(Form("Signal efficiency vs. Background rejection (%s)", theMethodName.Data()));
   }

   return graph;
}


////////////////////////////////////////////////////////////////////////////////
/// Generate a collection of graphs, for all methods for a given class. Suitable
/// for comparing method performance. Convenience overload that takes the
/// dataset as a DataLoader and forwards to the name-based overload using the
/// loader's name.
///
/// Argument iClass specifies the class to generate the ROC curve in a
/// multiclass setting. It is ignored for binary classification.
///
/// NOTE: The ROC curve is 1 vs. all where the given class is considered signal
/// and the others considered background. This is ok in binary classification
/// but in multi class classification, the ROC surface is an N dimensional
/// shape, where N is number of classes - 1.
///
/// \param[in] loader DataLoader whose name identifies the dataset. It is
///                   dereferenced without a null check.
/// \param[in] iClass Forwarded as is.

TMultiGraph* TMVA::Factory::GetROCCurveAsMultiGraph(DataLoader *loader, UInt_t iClass)
{
   const TString datasetName(loader->GetName());
   return GetROCCurveAsMultiGraph(datasetName, iClass);
}


////////////////////////////////////////////////////////////////////////////////
/// Generate a collection of graphs, for all methods for a given class. Suitable
/// for comparing method performance.
///
/// Argument iClass specifies the class to generate the ROC curve in a
/// multiclass setting. It is ignored for binary classification.
///
/// NOTE: The ROC curve is 1 vs. all where the given class is considered signal
/// and the others considered background. This is ok in binary classification
/// but in multi class classification, the ROC surface is an N dimensional
/// shape, where N is number of classes - 1.
///
/// Each graph is titled with its method name and drawn with line width 2, a
/// running line colour (starting at 1) and fill colour 10.
///
/// \param[in] datasetname Name of the dataset (key into the methods map).
/// \param[in] iClass      Class treated as signal in the multiclass case.
/// \return A newly allocated TMultiGraph holding one graph per method, or
///         nullptr (after logging a kERROR) when the dataset is unknown or no
///         graph could be added.

TMultiGraph* TMVA::Factory::GetROCCurveAsMultiGraph(TString datasetname, UInt_t iClass)
{
   // Look the dataset up with find(): operator[] would silently insert a null
   // entry for an unknown dataset, which would then be dereferenced.
   auto itrMap = fMethodsMap.find(datasetname);
   if (itrMap == fMethodsMap.end() || itrMap->second == nullptr) {
      Log() << kERROR << Form("DataSet = %s not found in methods map.", datasetname.Data()) << Endl;
      return nullptr;
   }
   MVector *methods = itrMap->second;

   UInt_t line_color = 1;
   TMultiGraph *multigraph = new TMultiGraph();

   for (auto *method_raw : *methods) {
      TMVA::MethodBase *method = dynamic_cast<TMVA::MethodBase *>(method_raw);
      if (method == nullptr) {
         continue;
      }

      const TString methodName = method->GetMethodName();
      const UInt_t nClasses = method->DataInfo().GetNClasses();

      if (this->fAnalysisType == Types::kMulticlass && iClass >= nClasses) {
         // %u: both values are unsigned.
         Log() << kERROR
               << Form("Given class number (iClass = %u) does not exist. There are %u classes in dataset.", iClass,
                       nClasses)
               << Endl;
         continue;
      }

      // GetROCCurve returns nullptr on error (it logs the reason itself);
      // skip the method rather than dereferencing a null graph.
      TGraph *graph = this->GetROCCurve(datasetname, methodName, false, iClass);
      if (graph == nullptr) {
         continue;
      }

      graph->SetTitle(methodName);
      graph->SetLineWidth(2);
      graph->SetLineColor(line_color++);
      graph->SetFillColor(10);

      multigraph->Add(graph);
   }

   if (multigraph->GetListOfGraphs() == nullptr) {
      Log() << kERROR << Form("No methods have class %u defined.", iClass) << Endl;
      // Nothing was added; free the empty container instead of leaking it.
      delete multigraph;
      return nullptr;
   }

   return multigraph;
}


////////////////////////////////////////////////////////////////////////////////
/// Draws ROC curves for all methods booked with the factory for a given class
/// onto a canvas. Convenience overload that takes the dataset as a DataLoader
/// and forwards to the name-based overload using the loader's name.
///
/// Argument iClass specifies the class to generate the ROC curve in a
/// multiclass setting. It is ignored for binary classification.
///
/// NOTE: The ROC curve is 1 vs. all where the given class is considered signal
/// and the others considered background. This is ok in binary classification
/// but in multi class classification, the ROC surface is an N dimensional
/// shape, where N is number of classes - 1.
///
/// \param[in] loader DataLoader whose name identifies the dataset. It is
///                   dereferenced without a null check.
/// \param[in] iClass Forwarded as is.

TCanvas * TMVA::Factory::GetROCCurve(TMVA::DataLoader *loader, UInt_t iClass)
{
   const TString datasetName(loader->GetName());
   return GetROCCurve(datasetName, iClass);
}


////////////////////////////////////////////////////////////////////////////////
/// Draws ROC curves for all methods booked with the factory for a given class.
///
/// Argument iClass specifies the class to generate the ROC curve in a
/// multiclass setting. It is ignored for binary classification.
///
/// NOTE: The ROC curve is 1 vs. all where the given class is considered signal
/// and the others considered background. This is ok in binary classification
/// but in multi class classification, the ROC surface is an N dimensional
/// shape, where N is number of classes - 1.
///
/// \param[in] datasetname Name of the dataset (key into the methods map).
/// \param[in] iClass      Class treated as signal in the multiclass case.
/// \return A newly allocated canvas, or a null pointer (after logging a kERROR)
///         when the dataset is not in the methods map. If no multigraph could
///         be produced the canvas is returned with nothing drawn on it.

TCanvas * TMVA::Factory::GetROCCurve(TString datasetname, UInt_t iClass)
{
   if (fMethodsMap.find(datasetname) == fMethodsMap.end()) {
      Log() << kERROR << Form("DataSet = %s not found in methods map.", datasetname.Data()) << Endl;
      return nullptr;
   }

   const TString canvasName = Form("ROCCurve %s class %i", datasetname.Data(), iClass);
   TCanvas *canvas = new TCanvas(canvasName, "ROC Curve", 200, 10, 700, 500);
   canvas->SetGrid();

   TMultiGraph *multigraph = this->GetROCCurveAsMultiGraph(datasetname, iClass);
   if (multigraph == nullptr) {
      // Nothing to draw: hand back the empty canvas.
      return canvas;
   }

   multigraph->Draw("AL");

   multigraph->GetYaxis()->SetTitle("Background rejection (Specificity)");
   multigraph->GetXaxis()->SetTitle("Signal efficiency (Sensitivity)");

   // The class index is only part of the title in the multiclass case.
   TString titleString("Signal efficiency vs. Background rejection");
   if (this->fAnalysisType == Types::kMulticlass) {
      titleString += Form(" (Class=%i)", iClass);
   }

   // Workaround for TMultigraph not drawing title correctly.
   multigraph->GetHistogram()->SetTitle(titleString);
   multigraph->SetTitle(titleString);

   canvas->BuildLegend(0.15, 0.15, 0.35, 0.3, "MVA Method");

   return canvas;
}


////////////////////////////////////////////////////////////////////////////////

/// Iterates through all booked methods and calls training.
///
/// For every dataset entry in fMethodsMap, in this order:
///  1. each method is trained via TrainMethod(); methods whose dataset has
///     fewer than MinNoTrainingEvents training events are skipped with a
///     warning,
///  2. unless the analysis type is regression, the method-specific variable
///     ranking is created and printed,
///  3. unless the factory is in silent-file mode, the training history of each
///     method is saved in the method's base directory,
///  4. if fModelPersistence is set, each method is deleted and recreated from
///     its weight file, and the new instance replaces the old one in the
///     methods vector.
///
/// Returns early (after an info message) when no method is booked.


void TMVA::Factory::TrainAllMethods()

{

    Log() << kHEADER << gTools().Color("bold") << "Train all methods" << gTools().Color("reset") << Endl;

   // iterates over all MVAs that have been booked, and calls their training methods


   // don't do anything if no method booked

   if (fMethodsMap.empty()) {

      Log() << kINFO << "...nothing found to train" << Endl;

      return;

   }


   // here the training starts

   //Log() << kINFO << " " << Endl;

   Log() << kDEBUG << "Train all methods for "

         << (fAnalysisType == Types::kRegression ? "Regression" :

             (fAnalysisType == Types::kMulticlass ? "Multiclass" : "Classification") ) << " ..." << Endl;


   std::map<TString,MVector*>::iterator itrMap;


   // outer loop: one entry per dataset name, each holding its own vector of methods
   for(itrMap = fMethodsMap.begin();itrMap != fMethodsMap.end();++itrMap)

   {

      MVector *methods=itrMap->second;

      MVector::iterator itrMethod;


      // iterate over methods and train

      for( itrMethod = methods->begin(); itrMethod != methods->end(); ++itrMethod ) {

     // (re)set the Event training flag before handling each method
     Event::SetIsTraining(kTRUE);

     MethodBase* mva = dynamic_cast<MethodBase*>(*itrMethod);


     // entries that are not a MethodBase are silently skipped
     if(mva==0) continue;


     if(mva->DataInfo().GetDataSetManager()->DataInput().GetEntries() <=1) { // 0 entries --> 0 events, 1 entry --> dynamical dataset (or one entry)

         Log() << kFATAL << "No input data for the training provided!" << Endl;

     }


     // sanity checks on the dataset definition: regression needs at least one
     // target, (multiclass) classification needs at least two classes
     if(fAnalysisType == Types::kRegression && mva->DataInfo().GetNTargets() < 1 )

     Log() << kFATAL << "You want to do regression training without specifying a target." << Endl;

     else if( (fAnalysisType == Types::kMulticlass || fAnalysisType == Types::kClassification)

      && mva->DataInfo().GetNClasses() < 2 )

     Log() << kFATAL << "You want to do classification training, but specified less than two classes." << Endl;


     // first print some information about the default dataset

     if(!IsSilentFile()) WriteDataInformation(mva->fDataSetInfo);


     // too few training events: warn and leave this method untrained
     if (mva->Data()->GetNTrainingEvents() < MinNoTrainingEvents) {

       Log() << kWARNING << "Method " << mva->GetMethodName()

        << " not trained (training tree has less entries ["

        << mva->Data()->GetNTrainingEvents()

        << "] than required [" << MinNoTrainingEvents << "]" << Endl;

       continue;

     }


     Log() << kHEADER << "Train method: " << mva->GetMethodName() << " for "

      << (fAnalysisType == Types::kRegression ? "Regression" :

          (fAnalysisType == Types::kMulticlass ? "Multiclass classification" : "Classification")) << Endl << Endl;

          mva->TrainMethod();

          Log() << kHEADER << "Training finished" << Endl << Endl;

      }


      // the variable ranking is only produced for classification / multiclass
      if (fAnalysisType != Types::kRegression) {


     // variable ranking

     //Log() << Endl;

     Log() << kINFO << "Ranking input variables (method specific)..." << Endl;

     for (itrMethod = methods->begin(); itrMethod != methods->end(); ++itrMethod) {

       MethodBase* mva = dynamic_cast<MethodBase*>(*itrMethod);

       // same minimum-events criterion as in the training loop above, so
       // methods skipped there are skipped here as well
       if (mva && mva->Data()->GetNTrainingEvents() >= MinNoTrainingEvents) {


      // create and print ranking

      const Ranking* ranking = (*itrMethod)->CreateRanking();

      if (ranking != 0) ranking->Print();

      else Log() << kINFO << "No variable ranking supplied by classifier: "

           << dynamic_cast<MethodBase*>(*itrMethod)->GetMethodName() << Endl;

       }

     }

      }


      // save training history in case we are not in the silent mode

      if (!IsSilentFile()) {

         for (UInt_t i=0; i<methods->size(); i++) {

            MethodBase* m = dynamic_cast<MethodBase*>((*methods)[i]);

            if(m==0) continue;

            // change into the method's base directory before saving its history
            m->BaseDir()->cd();

            m->fTrainHistory.SaveHistory(m->GetMethodName());

         }

      }


      // delete all methods and recreate them from weight file - this ensures that the application

      // of the methods (in TMVAClassificationApplication) is consistent with the results obtained

      // in the testing

      //Log() << Endl;

      if (fModelPersistence) {


      Log() << kHEADER << "=== Destroy and recreate all methods via weight files for testing ===" << Endl << Endl;


      if(!IsSilentFile())RootBaseDir()->cd();


     // iterate through all booked methods

     for (UInt_t i=0; i<methods->size(); i++) {


        MethodBase *m = dynamic_cast<MethodBase *>((*methods)[i]);

        if (m == nullptr)

           continue;


        // remember everything needed from the old instance before it is deleted
        TMVA::Types::EMVA methodType = m->GetMethodType();

        TString weightfile = m->GetWeightFileName();


        // decide if .txt or .xml file should be read:

        // (READXML is defined outside this section of the file)
        if (READXML)

           weightfile.ReplaceAll(".txt", ".xml");


        // NOTE(review): this reference is used after `m` is deleted below, so the
        // DataSetInfo is presumably not owned by the method - confirm.
        DataSetInfo &dataSetInfo = m->DataInfo();

        TString testvarName = m->GetTestvarName();

        delete m; // itrMethod[i];


        // recreate

        // NOTE(review): the result of the dynamic_cast is dereferenced right
        // away without a null check.
        m = dynamic_cast<MethodBase *>(ClassifierFactory::Instance().Create(

           Types::Instance().GetMethodName(methodType).Data(), dataSetInfo, weightfile));

        // category methods additionally get their dataset manager set
        if (m->GetMethodType() == Types::kCategory) {

           MethodCategory *methCat = (dynamic_cast<MethodCategory *>(m));

           if (!methCat)

              Log() << kFATAL << "Method with type kCategory cannot be casted to MethodCategory. /Factory" << Endl;

           else

              methCat->fDataSetManager = m->DataInfo().GetDataSetManager();

        }

        // ToDo, Do we need to fill the DataSetManager of MethodBoost here too?


        // weight file directory is "<dataset name>/<configured weight file dir>"
        TString wfileDir = m->DataInfo().GetName();

        wfileDir += "/" + gConfig().GetIONames().fWeightFileDir;

        // configure the new instance like the factory, then load its state
        // from the weight file
        m->SetWeightFileDir(wfileDir);

        m->SetModelPersistence(fModelPersistence);

        m->SetSilentFile(IsSilentFile());

        m->SetAnalysisType(fAnalysisType);

        m->SetupMethod();

        m->ReadStateFromFile();

        m->SetTestvarName(testvarName);


        // replace trained method by newly created one (from weight file) in methods vector

        (*methods)[i] = m;

     }

       }

   }

}


////////////////////////////////////////////////////////////////////////////////

/// Evaluates all booked methods on the testing data and adds the output to the

/// Results in the corresponiding DataSet.

///


void TMVA::Factory::TestAllMethods()

{

   Log() << kHEADER << gTools().Color("bold") << "Test all methods" << gTools().Color("reset") << Endl;


   // don't do anything if no method booked

   if (fMethodsMap.empty()) {

      Log() << kINFO << "...nothing found to test" << Endl;

      return;

   }

   std::map<TString,MVector*>::iterator itrMap;


   for(itrMap = fMethodsMap.begin();itrMap != fMethodsMap.end();++itrMap)

   {

      MVector *methods=itrMap->second;

      MVector::iterator itrMethod;


      // iterate over methods and test

      for (itrMethod = methods->begin(); itrMethod != methods->end(); ++itrMethod) {

         Event::SetIsTraining(kFALSE);

         MethodBase *mva = dynamic_cast<MethodBase *>(*itrMethod);

         if (mva == 0)

            continue;

         Types::EAnalysisType analysisType = mva->GetAnalysisType();

         Log() << kHEADER << "Test method: " << mva->GetMethodName() << " for "

               << (analysisType == Types::kRegression

                      ? "Regression"

                      : (analysisType == Types::kMulticlass ? "Multiclass classification" : "Classification"))

               << " performance" << Endl << Endl;

         mva->AddOutput(Types::kTesting, analysisType);

      }

   }

}


////////////////////////////////////////////////////////////////////////////////


void TMVA::Factory::MakeClass(const TString& datasetname , const TString& methodTitle ) const

{

   if (methodTitle != "") {

      IMethod* method = GetMethod(datasetname, methodTitle);

      if (method) method->MakeClass();

      else {

         Log() << kWARNING << "<MakeClass> Could not find classifier \"" << methodTitle

               << "\" in list" << Endl;

      }

   }

   else {


      // no classifier specified, print all help messages

      MVector *methods=fMethodsMap.find(datasetname)->second;

      MVector::const_iterator itrMethod;

      for (itrMethod    = methods->begin(); itrMethod != methods->end(); ++itrMethod) {

         MethodBase* method = dynamic_cast<MethodBase*>(*itrMethod);

         if(method==0) continue;

         Log() << kINFO << "Make response class for classifier: " << method->GetMethodName() << Endl;

         method->MakeClass();

      }

   }

}


////////////////////////////////////////////////////////////////////////////////

/// Print predefined help message of classifier.

/// Iterate over methods and test.


void TMVA::Factory::PrintHelpMessage(const TString& datasetname , const TString& methodTitle ) const

{

   if (methodTitle != "") {

      IMethod* method = GetMethod(datasetname , methodTitle );

      if (method) method->PrintHelpMessage();

      else {

         Log() << kWARNING << "<PrintHelpMessage> Could not find classifier \"" << methodTitle

               << "\" in list" << Endl;

      }

   }

   else {


      // no classifier specified, print all help messages

      MVector *methods=fMethodsMap.find(datasetname)->second;

      MVector::const_iterator itrMethod ;

      for (itrMethod    = methods->begin(); itrMethod != methods->end(); ++itrMethod) {

         MethodBase* method = dynamic_cast<MethodBase*>(*itrMethod);

         if(method==0) continue;

         Log() << kINFO << "Print help message for classifier: " << method->GetMethodName() << Endl;

         method->PrintHelpMessage();

      }

   }

}


////////////////////////////////////////////////////////////////////////////////
/// Iterates over all MVA input variables and books a "Variable" method for
/// each of them.
///
/// The method title is the variable's label; ":V" is appended to it when
/// `options` contains "V". The Event training flag is cleared before booking.
///
/// \param[in] loader  DataLoader providing the variables; it is dereferenced
///                    without a null check.
/// \param[in] options Option string; only checked for containing "V".

void TMVA::Factory::EvaluateAllVariables(DataLoader *loader, TString options )
{
   Log() << kINFO << "Evaluating all variables..." << Endl;
   Event::SetIsTraining(kFALSE);

   // the option string does not change while booking, so test it once
   const Bool_t appendVerbose = options.Contains("V");

   for (UInt_t ivar = 0; ivar < loader->GetDataSetInfo().GetNVariables(); ++ivar) {
      TString title = loader->GetDataSetInfo().GetVariableInfo(ivar).GetLabel();
      if (appendVerbose) {
         title += ":V";
      }
      this->BookMethod(loader, "Variable", title);
   }
}


////////////////////////////////////////////////////////////////////////////////

/// Iterates over all MVAs that have been booked, and calls their evaluation methods.


void TMVA::Factory::EvaluateAllMethods( void )

{

   Log() << kHEADER << gTools().Color("bold") << "Evaluate all methods" << gTools().Color("reset") << Endl;


   // don't do anything if no method booked

   if (fMethodsMap.empty()) {

      Log() << kINFO << "...nothing found to evaluate" << Endl;

      return;

   }

   std::map<TString,MVector*>::iterator itrMap;


   for(itrMap = fMethodsMap.begin();itrMap != fMethodsMap.end();++itrMap)

   {

      MVector *methods=itrMap->second;


      // -----------------------------------------------------------------------

      // First part of evaluation process

      // --> compute efficiencies, and other separation estimators

      // -----------------------------------------------------------------------


      // although equal, we now want to separate the output for the variables

      // and the real methods

      Int_t isel;                  // will be 0 for a Method; 1 for a Variable

      Int_t nmeth_used[2] = {0,0}; // 0 Method; 1 Variable


      std::vector<std::vector<TString> >  mname(2);

      std::vector<std::vector<Double_t> > sig(2), sep(2), roc(2);

      std::vector<std::vector<Double_t> > eff01(2), eff10(2), eff30(2), effArea(2);

      std::vector<std::vector<Double_t> > eff01err(2), eff10err(2), eff30err(2);

      std::vector<std::vector<Double_t> > trainEff01(2), trainEff10(2), trainEff30(2);


      std::vector<std::vector<Float_t> > multiclass_testEff;

      std::vector<std::vector<Float_t> > multiclass_trainEff;

      std::vector<std::vector<Float_t> > multiclass_testPur;

      std::vector<std::vector<Float_t> > multiclass_trainPur;


      std::vector<std::vector<Float_t> > train_history;


      // Multiclass confusion matrices.

      std::vector<TMatrixD> multiclass_trainConfusionEffB01;

      std::vector<TMatrixD> multiclass_trainConfusionEffB10;

      std::vector<TMatrixD> multiclass_trainConfusionEffB30;

      std::vector<TMatrixD> multiclass_testConfusionEffB01;

      std::vector<TMatrixD> multiclass_testConfusionEffB10;

      std::vector<TMatrixD> multiclass_testConfusionEffB30;


      std::vector<std::vector<Double_t> > biastrain(1);  // "bias" of the regression on the training data

      std::vector<std::vector<Double_t> > biastest(1);   // "bias" of the regression on test data

      std::vector<std::vector<Double_t> > devtrain(1);   // "dev" of the regression on the training data

      std::vector<std::vector<Double_t> > devtest(1);    // "dev" of the regression on test data

      std::vector<std::vector<Double_t> > rmstrain(1);   // "rms" of the regression on the training data

      std::vector<std::vector<Double_t> > rmstest(1);    // "rms" of the regression on test data

      std::vector<std::vector<Double_t> > minftrain(1);  // "minf" of the regression on the training data

      std::vector<std::vector<Double_t> > minftest(1);   // "minf" of the regression on test data

      std::vector<std::vector<Double_t> > rhotrain(1);   // correlation of the regression on the training data

      std::vector<std::vector<Double_t> > rhotest(1);    // correlation of the regression on test data


      // same as above but for 'truncated' quantities (computed for events within 2sigma of RMS)

      std::vector<std::vector<Double_t> > biastrainT(1);

      std::vector<std::vector<Double_t> > biastestT(1);

      std::vector<std::vector<Double_t> > devtrainT(1);

      std::vector<std::vector<Double_t> > devtestT(1);

      std::vector<std::vector<Double_t> > rmstrainT(1);

      std::vector<std::vector<Double_t> > rmstestT(1);

      std::vector<std::vector<Double_t> > minftrainT(1);

      std::vector<std::vector<Double_t> > minftestT(1);


      // following vector contains all methods - with the exception of Cuts, which are special

      MVector methodsNoCuts;


      Bool_t doRegression = kFALSE;

      Bool_t doMulticlass = kFALSE;


      // iterate over methods and evaluate

      for (MVector::iterator itrMethod =methods->begin(); itrMethod != methods->end(); ++itrMethod) {

     Event::SetIsTraining(kFALSE);

     MethodBase* theMethod = dynamic_cast<MethodBase*>(*itrMethod);

     if(theMethod==0) continue;

     theMethod->SetFile(fgTargetFile);

     theMethod->SetSilentFile(IsSilentFile());

     if (theMethod->GetMethodType() != Types::kCuts) methodsNoCuts.push_back( *itrMethod );


     if (theMethod->DoRegression()) {

       doRegression = kTRUE;


       Log() << kINFO << "Evaluate regression method: " << theMethod->GetMethodName() << Endl;

       Double_t bias, dev, rms, mInf;

       Double_t biasT, devT, rmsT, mInfT;

       Double_t rho;


       Log() << kINFO << "TestRegression (testing)" << Endl;

       theMethod->TestRegression( bias, biasT, dev, devT, rms, rmsT, mInf, mInfT, rho, TMVA::Types::kTesting  );

       biastest[0]  .push_back( bias );

       devtest[0]   .push_back( dev );

       rmstest[0]   .push_back( rms );

       minftest[0]  .push_back( mInf );

       rhotest[0]   .push_back( rho );

       biastestT[0] .push_back( biasT );

       devtestT[0]  .push_back( devT );

       rmstestT[0]  .push_back( rmsT );

       minftestT[0] .push_back( mInfT );


       Log() << kINFO << "TestRegression (training)" << Endl;

       theMethod->TestRegression( bias, biasT, dev, devT, rms, rmsT, mInf, mInfT, rho, TMVA::Types::kTraining  );

       biastrain[0] .push_back( bias );

       devtrain[0]  .push_back( dev );

       rmstrain[0]  .push_back( rms );

       minftrain[0] .push_back( mInf );

       rhotrain[0]  .push_back( rho );

       biastrainT[0].push_back( biasT );

       devtrainT[0] .push_back( devT );

       rmstrainT[0] .push_back( rmsT );

       minftrainT[0].push_back( mInfT );


       mname[0].push_back( theMethod->GetMethodName() );

       nmeth_used[0]++;

       if (!IsSilentFile()) {

          Log() << kDEBUG << "\tWrite evaluation histograms to file" << Endl;

          theMethod->WriteEvaluationHistosToFile(Types::kTesting);

          theMethod->WriteEvaluationHistosToFile(Types::kTraining);

       }

     } else if (theMethod->DoMulticlass()) {

        // ====================================================================

        // === Multiclass evaluation

        // ====================================================================

        doMulticlass = kTRUE;

        Log() << kINFO << "Evaluate multiclass classification method: " << theMethod->GetMethodName() << Endl;


        // This part uses a genetic alg. to evaluate the optimal sig eff * sig pur.

        // This is why it is disabled for now.

        // Find approximate optimal working point w.r.t. signalEfficiency * signalPurity.

        // theMethod->TestMulticlass(); // This is where the actual GA calc is done

        // multiclass_testEff.push_back(theMethod->GetMulticlassEfficiency(multiclass_testPur));


        theMethod->TestMulticlass();


        // Confusion matrix at three background efficiency levels

        multiclass_trainConfusionEffB01.push_back(theMethod->GetMulticlassConfusionMatrix(0.01, Types::kTraining));

        multiclass_trainConfusionEffB10.push_back(theMethod->GetMulticlassConfusionMatrix(0.10, Types::kTraining));

        multiclass_trainConfusionEffB30.push_back(theMethod->GetMulticlassConfusionMatrix(0.30, Types::kTraining));


        multiclass_testConfusionEffB01.push_back(theMethod->GetMulticlassConfusionMatrix(0.01, Types::kTesting));

        multiclass_testConfusionEffB10.push_back(theMethod->GetMulticlassConfusionMatrix(0.10, Types::kTesting));

        multiclass_testConfusionEffB30.push_back(theMethod->GetMulticlassConfusionMatrix(0.30, Types::kTesting));


        if (!IsSilentFile()) {

           Log() << kDEBUG << "\tWrite evaluation histograms to file" << Endl;

           theMethod->WriteEvaluationHistosToFile(Types::kTesting);

           theMethod->WriteEvaluationHistosToFile(Types::kTraining);

        }


        nmeth_used[0]++;

        mname[0].push_back(theMethod->GetMethodName());

     } else {


        Log() << kHEADER << "Evaluate classifier: " << theMethod->GetMethodName() << Endl << Endl;

        isel = (theMethod->GetMethodTypeName().Contains("Variable")) ? 1 : 0;


        // perform the evaluation

        theMethod->TestClassification();


        // evaluate the classifier

        mname[isel].push_back(theMethod->GetMethodName());

        sig[isel].push_back(theMethod->GetSignificance());

        sep[isel].push_back(theMethod->GetSeparation());

        roc[isel].push_back(theMethod->GetROCIntegral());


        Double_t err;

        eff01[isel].push_back(theMethod->GetEfficiency("Efficiency:0.01", Types::kTesting, err));

        eff01err[isel].push_back(err);

        eff10[isel].push_back(theMethod->GetEfficiency("Efficiency:0.10", Types::kTesting, err));

        eff10err[isel].push_back(err);

        eff30[isel].push_back(theMethod->GetEfficiency("Efficiency:0.30", Types::kTesting, err));

        eff30err[isel].push_back(err);

        effArea[isel].push_back(theMethod->GetEfficiency("", Types::kTesting, err)); // computes the area (average)


        trainEff01[isel].push_back(theMethod->GetTrainingEfficiency("Efficiency:0.01")); // the first pass takes longer

        trainEff10[isel].push_back(theMethod->GetTrainingEfficiency("Efficiency:0.10"));

        trainEff30[isel].push_back(theMethod->GetTrainingEfficiency("Efficiency:0.30"));


        nmeth_used[isel]++;


        if (!IsSilentFile()) {

           Log() << kDEBUG << "\tWrite evaluation histograms to file" << Endl;

           theMethod->WriteEvaluationHistosToFile(Types::kTesting);

           theMethod->WriteEvaluationHistosToFile(Types::kTraining);

        }

     }

      }

      if (doRegression) {


     std::vector<TString> vtemps = mname[0];

     std::vector< std::vector<Double_t> > vtmp;

     vtmp.push_back( devtest[0]   );  // this is the vector that is ranked

     vtmp.push_back( devtrain[0]  );

     vtmp.push_back( biastest[0]  );

     vtmp.push_back( biastrain[0] );

     vtmp.push_back( rmstest[0]   );

     vtmp.push_back( rmstrain[0]  );

     vtmp.push_back( minftest[0]  );

     vtmp.push_back( minftrain[0] );

     vtmp.push_back( rhotest[0]   );

     vtmp.push_back( rhotrain[0]  );

     vtmp.push_back( devtestT[0]  );  // this is the vector that is ranked

     vtmp.push_back( devtrainT[0] );

     vtmp.push_back( biastestT[0] );

     vtmp.push_back( biastrainT[0]);

     vtmp.push_back( rmstestT[0]  );

     vtmp.push_back( rmstrainT[0] );

     vtmp.push_back( minftestT[0] );

     vtmp.push_back( minftrainT[0]);

     gTools().UsefulSortAscending( vtmp, &vtemps );

     mname[0]      = vtemps;

     devtest[0]    = vtmp[0];

     devtrain[0]   = vtmp[1];

     biastest[0]   = vtmp[2];

     biastrain[0]  = vtmp[3];

     rmstest[0]    = vtmp[4];

     rmstrain[0]   = vtmp[5];

     minftest[0]   = vtmp[6];

     minftrain[0]  = vtmp[7];

     rhotest[0]    = vtmp[8];

     rhotrain[0]   = vtmp[9];

     devtestT[0]   = vtmp[10];

     devtrainT[0]  = vtmp[11];

     biastestT[0]  = vtmp[12];

     biastrainT[0] = vtmp[13];

     rmstestT[0]   = vtmp[14];

     rmstrainT[0]  = vtmp[15];

     minftestT[0]  = vtmp[16];

     minftrainT[0] = vtmp[17];

      } else if (doMulticlass) {

         // TODO: fill in something meaningful

         // If there is some ranking of methods to be done it should be done here.

         // However, this is not so easy to define for multiclass so it is left out for now.


      }

      else {

     // now sort the methods (k=0) and the variables (k=1) by the efficiency area ('effArea', pushed first below)

     for (Int_t k=0; k<2; k++) {

       std::vector< std::vector<Double_t> > vtemp;

       vtemp.push_back( effArea[k] );  // this is the vector that is ranked

       vtemp.push_back( eff10[k] );

       vtemp.push_back( eff01[k] );

       vtemp.push_back( eff30[k] );

       vtemp.push_back( eff10err[k] );

       vtemp.push_back( eff01err[k] );

       vtemp.push_back( eff30err[k] );

       vtemp.push_back( trainEff10[k] );

       vtemp.push_back( trainEff01[k] );

       vtemp.push_back( trainEff30[k] );

       vtemp.push_back( sig[k] );

       vtemp.push_back( sep[k] );

       vtemp.push_back( roc[k] );

       std::vector<TString> vtemps = mname[k];

       gTools().UsefulSortDescending( vtemp, &vtemps );

       effArea[k]    = vtemp[0];

       eff10[k]      = vtemp[1];

       eff01[k]      = vtemp[2];

       eff30[k]      = vtemp[3];

       eff10err[k]   = vtemp[4];

       eff01err[k]   = vtemp[5];

       eff30err[k]   = vtemp[6];

       trainEff10[k] = vtemp[7];

       trainEff01[k] = vtemp[8];

       trainEff30[k] = vtemp[9];

       sig[k]        = vtemp[10];

       sep[k]        = vtemp[11];

       roc[k]        = vtemp[12];

       mname[k]      = vtemps;

     }

      }


      // -----------------------------------------------------------------------

      // Second part of evaluation process

      // --> compute correlations among MVAs

      // --> compute correlations between input variables and MVA (determines importance)

      // --> count overlaps

      // -----------------------------------------------------------------------

      if(fCorrelations)

      {

     const Int_t nmeth = methodsNoCuts.size();

     MethodBase* method = dynamic_cast<MethodBase*>(methods[0][0]);

     const Int_t nvar  = method->fDataSetInfo.GetNVariables();

     if (!doRegression && !doMulticlass ) {


         if (nmeth > 0) {


    //              needed for correlations

      Double_t *dvec = new Double_t[nmeth+nvar];

      std::vector<Double_t> rvec;


    //              for correlations

      TPrincipal* tpSig = new TPrincipal( nmeth+nvar, "" );

      TPrincipal* tpBkg = new TPrincipal( nmeth+nvar, "" );


    //              set required tree branch references

      Int_t ivar = 0;

      std::vector<TString>* theVars = new std::vector<TString>;

      std::vector<ResultsClassification*> mvaRes;

      for (MVector::iterator itrMethod = methodsNoCuts.begin(); itrMethod != methodsNoCuts.end(); ++itrMethod, ++ivar) {

          MethodBase* m = dynamic_cast<MethodBase*>(*itrMethod);

          if(m==0) continue;

          theVars->push_back( m->GetTestvarName() );

          rvec.push_back( m->GetSignalReferenceCut() );

          theVars->back().ReplaceAll( "MVA_", "" );

          mvaRes.push_back( dynamic_cast<ResultsClassification*>( m->Data()->GetResults( m->GetMethodName(),

                                      Types::kTesting,

                                      Types::kMaxAnalysisType) ) );

      }


    //              for overlap study

      TMatrixD* overlapS = new TMatrixD( nmeth, nmeth );

      TMatrixD* overlapB = new TMatrixD( nmeth, nmeth );

      (*overlapS) *= 0; // init...

      (*overlapB) *= 0; // init...


    //              loop over test tree

      DataSet* defDs = method->fDataSetInfo.GetDataSet();

      defDs->SetCurrentType(Types::kTesting);

      for (Int_t ievt=0; ievt<defDs->GetNEvents(); ievt++) {

          const Event* ev = defDs->GetEvent(ievt);


    //                 for correlations

          TMatrixD* theMat = 0;

          for (Int_t im=0; im<nmeth; im++) {

    //                    check for NaN value

            Double_t retval = (Double_t)(*mvaRes[im])[ievt][0];

            if (TMath::IsNaN(retval)) {

           Log() << kWARNING << "Found NaN return value in event: " << ievt

            << " for method \"" << methodsNoCuts[im]->GetName() << "\"" << Endl;

           dvec[im] = 0;

            }

            else dvec[im] = retval;

          }

          for (Int_t iv=0; iv<nvar;  iv++) dvec[iv+nmeth]  = (Double_t)ev->GetValue(iv);

          if (method->fDataSetInfo.IsSignal(ev)) { tpSig->AddRow( dvec ); theMat = overlapS; }

          else                                   { tpBkg->AddRow( dvec ); theMat = overlapB; }


    //                 count overlaps

          for (Int_t im=0; im<nmeth; im++) {

            for (Int_t jm=im; jm<nmeth; jm++) {

           if ((dvec[im] - rvec[im])*(dvec[jm] - rvec[jm]) > 0) {

             (*theMat)(im,jm)++;

             if (im != jm) (*theMat)(jm,im)++;

           }

            }

          }

      }


    //              renormalise overlap matrix

      (*overlapS) *= (1.0/defDs->GetNEvtSigTest());  // init...

      (*overlapB) *= (1.0/defDs->GetNEvtBkgdTest()); // init...


      tpSig->MakePrincipals();

      tpBkg->MakePrincipals();


      const TMatrixD* covMatS = tpSig->GetCovarianceMatrix();

      const TMatrixD* covMatB = tpBkg->GetCovarianceMatrix();


      const TMatrixD* corrMatS = gTools().GetCorrelationMatrix( covMatS );

      const TMatrixD* corrMatB = gTools().GetCorrelationMatrix( covMatB );


    //              print correlation matrices

      if (corrMatS != 0 && corrMatB != 0) {


    //                 extract MVA matrix

          TMatrixD mvaMatS(nmeth,nmeth);

          TMatrixD mvaMatB(nmeth,nmeth);

          for (Int_t im=0; im<nmeth; im++) {

            for (Int_t jm=0; jm<nmeth; jm++) {

           mvaMatS(im,jm) = (*corrMatS)(im,jm);

           mvaMatB(im,jm) = (*corrMatB)(im,jm);

            }

          }


    //                 extract variables - to MVA matrix

          std::vector<TString> theInputVars;

          TMatrixD varmvaMatS(nvar,nmeth);

          TMatrixD varmvaMatB(nvar,nmeth);

          for (Int_t iv=0; iv<nvar; iv++) {

            theInputVars.push_back( method->fDataSetInfo.GetVariableInfo( iv ).GetLabel() );

            for (Int_t jm=0; jm<nmeth; jm++) {

           varmvaMatS(iv,jm) = (*corrMatS)(nmeth+iv,jm);

           varmvaMatB(iv,jm) = (*corrMatB)(nmeth+iv,jm);

            }

          }


          if (nmeth > 1) {

            Log() << kINFO << Endl;

            Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "Inter-MVA correlation matrix (signal):" << Endl;

            gTools().FormattedOutput( mvaMatS, *theVars, Log() );

            Log() << kINFO << Endl;


            Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "Inter-MVA correlation matrix (background):" << Endl;

            gTools().FormattedOutput( mvaMatB, *theVars, Log() );

            Log() << kINFO << Endl;

          }


          Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "Correlations between input variables and MVA response (signal):" << Endl;

          gTools().FormattedOutput( varmvaMatS, theInputVars, *theVars, Log() );

          Log() << kINFO << Endl;


          Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "Correlations between input variables and MVA response (background):" << Endl;

          gTools().FormattedOutput( varmvaMatB, theInputVars, *theVars, Log() );

          Log() << kINFO << Endl;

      }

      else Log() << kWARNING <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "<TestAllMethods> cannot compute correlation matrices" << Endl;


    //              print overlap matrices

      Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "The following \"overlap\" matrices contain the fraction of events for which " << Endl;

      Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "the MVAs 'i' and 'j' have returned conform answers about \"signal-likeness\"" << Endl;

      Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "An event is signal-like, if its MVA output exceeds the following value:" << Endl;

      gTools().FormattedOutput( rvec, *theVars, "Method" , "Cut value", Log() );

      Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "which correspond to the working point: eff(signal) = 1 - eff(background)" << Endl;


    //              give notice that cut method has been excluded from this test

      if (nmeth != (Int_t)methods->size())

          Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "Note: no correlations and overlap with cut method are provided at present" << Endl;


      if (nmeth > 1) {

          Log() << kINFO << Endl;

          Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "Inter-MVA overlap matrix (signal):" << Endl;

          gTools().FormattedOutput( *overlapS, *theVars, Log() );

          Log() << kINFO << Endl;


          Log() << kINFO <<Form("Dataset[%s] : ",method->fDataSetInfo.GetName())<< "Inter-MVA overlap matrix (background):" << Endl;

          gTools().FormattedOutput( *overlapB, *theVars, Log() );

      }


    //              cleanup

      delete tpSig;

      delete tpBkg;

      delete corrMatS;

      delete corrMatB;

      delete theVars;

      delete overlapS;

      delete overlapB;

      delete [] dvec;

         }

     }

      }

      // -----------------------------------------------------------------------

      // Third part of evaluation process

      // --> output

      // -----------------------------------------------------------------------


      if (doRegression) {


     Log() << kINFO << Endl;

     TString hLine = "--------------------------------------------------------------------------------------------------";

     Log() << kINFO << "Evaluation results ranked by smallest RMS on test sample:" << Endl;

     Log() << kINFO << "(\"Bias\" quotes the mean deviation of the regression from true target." << Endl;

     Log() << kINFO << " \"MutInf\" is the \"Mutual Information\" between regression and target." << Endl;

     Log() << kINFO << " Indicated by \"_T\" are the corresponding \"truncated\" quantities ob-" << Endl;

     Log() << kINFO << " tained when removing events deviating more than 2sigma from average.)" << Endl;

     Log() << kINFO << hLine << Endl;

     //Log() << kINFO << "DataSet Name:        MVA Method:        <Bias>   <Bias_T>    RMS    RMS_T  |  MutInf MutInf_T" << Endl;

     Log() << kINFO << hLine << Endl;


     for (Int_t i=0; i<nmeth_used[0]; i++) {

       MethodBase* theMethod = dynamic_cast<MethodBase*>((*methods)[i]);

       if(theMethod==0) continue;


       Log() << kINFO << Form("%-20s %-15s:%#9.3g%#9.3g%#9.3g%#9.3g  |  %#5.3f  %#5.3f",

                    theMethod->fDataSetInfo.GetName(),

                    (const char*)mname[0][i],

                    biastest[0][i], biastestT[0][i],

                    rmstest[0][i], rmstestT[0][i],

                    minftest[0][i], minftestT[0][i] )

            << Endl;

     }

     Log() << kINFO << hLine << Endl;

     Log() << kINFO << Endl;

     Log() << kINFO << "Evaluation results ranked by smallest RMS on training sample:" << Endl;

     Log() << kINFO << "(overtraining check)" << Endl;

     Log() << kINFO << hLine << Endl;

     Log() << kINFO << "DataSet Name:         MVA Method:        <Bias>   <Bias_T>    RMS    RMS_T  |  MutInf MutInf_T" << Endl;

     Log() << kINFO << hLine << Endl;


     for (Int_t i=0; i<nmeth_used[0]; i++) {

       MethodBase* theMethod = dynamic_cast<MethodBase*>((*methods)[i]);

       if(theMethod==0) continue;

       Log() << kINFO << Form("%-20s %-15s:%#9.3g%#9.3g%#9.3g%#9.3g  |  %#5.3f  %#5.3f",

                    theMethod->fDataSetInfo.GetName(),

                    (const char*)mname[0][i],

                    biastrain[0][i], biastrainT[0][i],

                    rmstrain[0][i], rmstrainT[0][i],

                    minftrain[0][i], minftrainT[0][i] )

            << Endl;

     }

     Log() << kINFO << hLine << Endl;

     Log() << kINFO << Endl;

      } else if (doMulticlass) {

         // ====================================================================

         // === Multiclass Output

         // ====================================================================


         TString hLine =

            "-------------------------------------------------------------------------------------------------------";


         // This part uses a genetic alg. to evaluate the optimal sig eff * sig pur.

         // This is why it is disabled for now.

         //

         // // --- Achievable signal efficiency * signal purity

         // // --------------------------------------------------------------------

         // Log() << kINFO << Endl;

         // Log() << kINFO << "Evaluation results ranked by best signal efficiency times signal purity " << Endl;

         // Log() << kINFO << hLine << Endl;


         // // iterate over methods and evaluate

         // for (MVector::iterator itrMethod = methods->begin(); itrMethod != methods->end(); itrMethod++) {

         //    MethodBase *theMethod = dynamic_cast<MethodBase *>(*itrMethod);

         //    if (theMethod == 0) {

         //       continue;

         //    }


         //    TString header = "DataSet Name     MVA Method     ";

         //    for (UInt_t icls = 0; icls < theMethod->fDataSetInfo.GetNClasses(); ++icls) {

         //       header += Form("%-12s ", theMethod->fDataSetInfo.GetClassInfo(icls)->GetName());

         //    }


         //    Log() << kINFO << header << Endl;

         //    Log() << kINFO << hLine << Endl;

         //    for (Int_t i = 0; i < nmeth_used[0]; i++) {

         //       TString res = Form("[%-14s] %-15s", theMethod->fDataSetInfo.GetName(), (const char *)mname[0][i]);

         //       for (UInt_t icls = 0; icls < theMethod->fDataSetInfo.GetNClasses(); ++icls) {

         //          res += Form("%#1.3f        ", (multiclass_testEff[i][icls]) * (multiclass_testPur[i][icls]));

         //       }

         //       Log() << kINFO << res << Endl;

         //    }


         //    Log() << kINFO << hLine << Endl;

         //    Log() << kINFO << Endl;

         // }


         // --- 1 vs Rest ROC AUC, signal efficiency @ given background efficiency

         // --------------------------------------------------------------------

         TString header1 = Form("%-15s%-15s%-15s%-15s%-15s%-15s", "Dataset", "MVA Method", "ROC AUC", "Sig eff@B=0.01",

                                "Sig eff@B=0.10", "Sig eff@B=0.30");

         TString header2 = Form("%-15s%-15s%-15s%-15s%-15s%-15s", "Name:", "/ Class:", "test  (train)", "test  (train)",

                                "test  (train)", "test  (train)");

         Log() << kINFO << Endl;

         Log() << kINFO << "1-vs-rest performance metrics per class" << Endl;

         Log() << kINFO << hLine << Endl;

         Log() << kINFO << Endl;

         Log() << kINFO << "Considers the listed class as signal and the other classes" << Endl;

         Log() << kINFO << "as background, reporting the resulting binary performance." << Endl;

         Log() << kINFO << "A score of 0.820 (0.850) means 0.820 was acheived on the" << Endl;

         Log() << kINFO << "test set and 0.850 on the training set." << Endl;


         Log() << kINFO << Endl;

         Log() << kINFO << header1 << Endl;

         Log() << kINFO << header2 << Endl;

         for (Int_t k = 0; k < 2; k++) {

            for (Int_t i = 0; i < nmeth_used[k]; i++) {

               if (k == 1) {

                  mname[k][i].ReplaceAll("Variable_", "");

               }


               const TString datasetName = itrMap->first;

               const TString mvaName = mname[k][i];


               MethodBase *theMethod = dynamic_cast<MethodBase *>(GetMethod(datasetName, mvaName));

               if (theMethod == 0) {

                  continue;

               }


               Log() << kINFO << Endl;

               TString row = Form("%-15s%-15s", datasetName.Data(), mvaName.Data());

               Log() << kINFO << row << Endl;

               Log() << kINFO << "------------------------------" << Endl;


               UInt_t numClasses = theMethod->fDataSetInfo.GetNClasses();

               for (UInt_t iClass = 0; iClass < numClasses; ++iClass) {


                  ROCCurve *rocCurveTrain = GetROC(datasetName, mvaName, iClass, Types::kTraining);

                  ROCCurve *rocCurveTest = GetROC(datasetName, mvaName, iClass, Types::kTesting);


                  const TString className = theMethod->DataInfo().GetClassInfo(iClass)->GetName();

                  const Double_t rocaucTrain = rocCurveTrain->GetROCIntegral();

                  const Double_t effB01Train = rocCurveTrain->GetEffSForEffB(0.01);

                  const Double_t effB10Train = rocCurveTrain->GetEffSForEffB(0.10);

                  const Double_t effB30Train = rocCurveTrain->GetEffSForEffB(0.30);

                  const Double_t rocaucTest = rocCurveTest->GetROCIntegral();

                  const Double_t effB01Test = rocCurveTest->GetEffSForEffB(0.01);

                  const Double_t effB10Test = rocCurveTest->GetEffSForEffB(0.10);

                  const Double_t effB30Test = rocCurveTest->GetEffSForEffB(0.30);

                  const TString rocaucCmp = Form("%5.3f (%5.3f)", rocaucTest, rocaucTrain);

                  const TString effB01Cmp = Form("%5.3f (%5.3f)", effB01Test, effB01Train);

                  const TString effB10Cmp = Form("%5.3f (%5.3f)", effB10Test, effB10Train);

                  const TString effB30Cmp = Form("%5.3f (%5.3f)", effB30Test, effB30Train);

                  row = Form("%-15s%-15s%-15s%-15s%-15s%-15s", "", className.Data(), rocaucCmp.Data(), effB01Cmp.Data(),

                             effB10Cmp.Data(), effB30Cmp.Data());

                  Log() << kINFO << row << Endl;


                  delete rocCurveTrain;

                  delete rocCurveTest;

               }

            }

         }

         Log() << kINFO << Endl;

         Log() << kINFO << hLine << Endl;

         Log() << kINFO << Endl;


         // --- Confusion matrices

         // --------------------------------------------------------------------

         auto printMatrix = [](TMatrixD const &matTraining, TMatrixD const &matTesting, std::vector<TString> classnames,

                               UInt_t numClasses, MsgLogger &stream) {

            // assert (classLabledWidth >= valueLabelWidth + 2)

            // if (...) {Log() << kWARN << "..." << Endl; }


            // TODO: Ensure matrices are same size.


            TString header = Form(" %-14s", " ");

            TString headerInfo = Form(" %-14s", " ");

            ;

            for (UInt_t iCol = 0; iCol < numClasses; ++iCol) {

               header += Form(" %-14s", classnames[iCol].Data());

               headerInfo += Form(" %-14s", " test (train)");

            }

            stream << kINFO << header << Endl;

            stream << kINFO << headerInfo << Endl;


            for (UInt_t iRow = 0; iRow < numClasses; ++iRow) {

               stream << kINFO << Form(" %-14s", classnames[iRow].Data());


               for (UInt_t iCol = 0; iCol < numClasses; ++iCol) {

                  if (iCol == iRow) {

                     stream << kINFO << Form(" %-14s", "-");

                  } else {

                     Double_t trainValue = matTraining[iRow][iCol];

                     Double_t testValue = matTesting[iRow][iCol];

                     TString entry = Form("%-5.3f (%-5.3f)", testValue, trainValue);

                     stream << kINFO << Form(" %-14s", entry.Data());

                  }

               }

               stream << kINFO << Endl;

            }

         };


         Log() << kINFO << Endl;

         Log() << kINFO << "Confusion matrices for all methods" << Endl;

         Log() << kINFO << hLine << Endl;

         Log() << kINFO << Endl;

         Log() << kINFO << "Does a binary comparison between the two classes given by a " << Endl;

         Log() << kINFO << "particular row-column combination. In each case, the class " << Endl;

         Log() << kINFO << "given by the row is considered signal while the class given " << Endl;

         Log() << kINFO << "by the column index is considered background." << Endl;

         Log() << kINFO << Endl;

         for (UInt_t iMethod = 0; iMethod < methods->size(); ++iMethod) {

            MethodBase *theMethod = dynamic_cast<MethodBase *>(methods->at(iMethod));

            if (theMethod == nullptr) {

               continue;

            }

            UInt_t numClasses = theMethod->fDataSetInfo.GetNClasses();


            std::vector<TString> classnames;

            for (UInt_t iCls = 0; iCls < numClasses; ++iCls) {

               classnames.push_back(theMethod->fDataSetInfo.GetClassInfo(iCls)->GetName());

            }

            Log() << kINFO

                  << "=== Showing confusion matrix for method : " << Form("%-15s", (const char *)mname[0][iMethod])

                  << Endl;

            Log() << kINFO << "(Signal Efficiency for Background Efficiency 0.01%)" << Endl;

            Log() << kINFO << "---------------------------------------------------" << Endl;

            printMatrix(multiclass_testConfusionEffB01[iMethod], multiclass_trainConfusionEffB01[iMethod], classnames,

                        numClasses, Log());

            Log() << kINFO << Endl;


            Log() << kINFO << "(Signal Efficiency for Background Efficiency 0.10%)" << Endl;

            Log() << kINFO << "---------------------------------------------------" << Endl;

            printMatrix(multiclass_testConfusionEffB10[iMethod], multiclass_trainConfusionEffB10[iMethod], classnames,

                        numClasses, Log());

            Log() << kINFO << Endl;


            Log() << kINFO << "(Signal Efficiency for Background Efficiency 0.30%)" << Endl;

            Log() << kINFO << "---------------------------------------------------" << Endl;

            printMatrix(multiclass_testConfusionEffB30[iMethod], multiclass_trainConfusionEffB30[iMethod], classnames,

                        numClasses, Log());

            Log() << kINFO << Endl;

         }

         Log() << kINFO << hLine << Endl;

         Log() << kINFO << Endl;


      } else {

         // Binary classification

         if (fROC) {

            Log().EnableOutput();

            gConfig().SetSilent(kFALSE);

            Log() << Endl;

            TString hLine = "------------------------------------------------------------------------------------------"

                            "-------------------------";

            Log() << kINFO << "Evaluation results ranked by best signal efficiency and purity (area)" << Endl;

            Log() << kINFO << hLine << Endl;

            Log() << kINFO << "DataSet       MVA                       " << Endl;

            Log() << kINFO << "Name:         Method:          ROC-integ" << Endl;


            //       Log() << kDEBUG << "DataSet              MVA              Signal efficiency at bkg eff.(error):

            //       | Sepa-    Signifi- "   << Endl; Log() << kDEBUG << "Name:                Method:          @B=0.01

            //       @B=0.10    @B=0.30    ROC-integ    ROCCurve| ration:  cance:   "   << Endl;

            Log() << kDEBUG << hLine << Endl;

            for (Int_t k = 0; k < 2; k++) {

               if (k == 1 && nmeth_used[k] > 0) {

                  Log() << kINFO << hLine << Endl;

                  Log() << kINFO << "Input Variables: " << Endl << hLine << Endl;

               }

               for (Int_t i = 0; i < nmeth_used[k]; i++) {

                  TString datasetName = itrMap->first;

                  TString methodName = mname[k][i];


                  if (k == 1) {

                     methodName.ReplaceAll("Variable_", "");

                  }


                  MethodBase *theMethod = dynamic_cast<MethodBase *>(GetMethod(datasetName, methodName));

                  if (theMethod == 0) {

                     continue;

                  }


                  TMVA::DataSet *dataset = theMethod->Data();

                  TMVA::Results *results = dataset->GetResults(methodName, Types::kTesting, this->fAnalysisType);

                  std::vector<Bool_t> *mvaResType =

                     dynamic_cast<ResultsClassification *>(results)->GetValueVectorTypes();


                  Double_t rocIntegral = 0.0;

                  if (mvaResType->size() != 0) {

                     rocIntegral = GetROCIntegral(datasetName, methodName);

                  }


                  if (sep[k][i] < 0 || sig[k][i] < 0) {

                     // cannot compute separation/significance -> no MVA (usually for Cuts)

                     Log() << kINFO << Form("%-13s %-15s: %#1.3f", datasetName.Data(), methodName.Data(), effArea[k][i])

                           << Endl;


                     //               Log() << kDEBUG << Form("%-20s %-15s: %#1.3f(%02i)  %#1.3f(%02i)  %#1.3f(%02i)

                     //               %#1.3f       %#1.3f | --       --",

                     //                       datasetName.Data(),

                     //                       methodName.Data(),

                     //                       eff01[k][i], Int_t(1000*eff01err[k][i]),

                     //                       eff10[k][i], Int_t(1000*eff10err[k][i]),

                     //                       eff30[k][i], Int_t(1000*eff30err[k][i]),

                     //                       effArea[k][i],rocIntegral) << Endl;

                  } else {

                     Log() << kINFO << Form("%-13s %-15s: %#1.3f", datasetName.Data(), methodName.Data(), rocIntegral)

                           << Endl;

                     //               Log() << kDEBUG << Form("%-20s %-15s: %#1.3f(%02i)  %#1.3f(%02i)  %#1.3f(%02i)

                     //               %#1.3f       %#1.3f | %#1.3f    %#1.3f",

                     //                       datasetName.Data(),

                     //                       methodName.Data(),

                     //                       eff01[k][i], Int_t(1000*eff01err[k][i]),

                     //                       eff10[k][i], Int_t(1000*eff10err[k][i]),

                     //                       eff30[k][i], Int_t(1000*eff30err[k][i]),

                     //                       effArea[k][i],rocIntegral,

                     //                       sep[k][i], sig[k][i]) << Endl;

                  }

               }

            }

            Log() << kINFO << hLine << Endl;

            Log() << kINFO << Endl;

            Log() << kINFO << "Testing efficiency compared to training efficiency (overtraining check)" << Endl;

            Log() << kINFO << hLine << Endl;

            Log() << kINFO

                  << "DataSet              MVA              Signal efficiency: from test sample (from training sample) "

                  << Endl;

            Log() << kINFO << "Name:                Method:          @B=0.01             @B=0.10            @B=0.30   "

                  << Endl;

            Log() << kINFO << hLine << Endl;

            for (Int_t k = 0; k < 2; k++) {

               if (k == 1 && nmeth_used[k] > 0) {

                  Log() << kINFO << hLine << Endl;

                  Log() << kINFO << "Input Variables: " << Endl << hLine << Endl;

               }

               for (Int_t i = 0; i < nmeth_used[k]; i++) {

                  if (k == 1) mname[k][i].ReplaceAll("Variable_", "");

                  MethodBase *theMethod = dynamic_cast<MethodBase *>((*methods)[i]);

                  if (theMethod == 0) continue;


                  Log() << kINFO << Form("%-20s %-15s: %#1.3f (%#1.3f)       %#1.3f (%#1.3f)      %#1.3f (%#1.3f)",

                                         theMethod->fDataSetInfo.GetName(), (const char *)mname[k][i], eff01[k][i],

                                         trainEff01[k][i], eff10[k][i], trainEff10[k][i], eff30[k][i], trainEff30[k][i])

                        << Endl;

               }

            }

            Log() << kINFO << hLine << Endl;

            Log() << kINFO << Endl;


            if (gTools().CheckForSilentOption(GetOptions())) Log().InhibitOutput();

         } // end fROC

     }

     if(!IsSilentFile())

     {

         std::list<TString> datasets;

         for (Int_t k=0; k<2; k++) {

      for (Int_t i=0; i<nmeth_used[k]; i++) {

          MethodBase* theMethod = dynamic_cast<MethodBase*>((*methods)[i]);

          if(theMethod==0) continue;

          // write test/training trees

          RootBaseDir()->cd(theMethod->fDataSetInfo.GetName());

          if(std::find(datasets.begin(), datasets.end(), theMethod->fDataSetInfo.GetName()) == datasets.end())

          {

            theMethod->fDataSetInfo.GetDataSet()->GetTree(Types::kTesting)->Write( "", TObject::kOverwrite );

            theMethod->fDataSetInfo.GetDataSet()->GetTree(Types::kTraining)->Write( "", TObject::kOverwrite );

            datasets.push_back(theMethod->fDataSetInfo.GetName());

          }

      }

         }

     }

   }//end for MethodsMap

   // references for citation

   gTools().TMVACitation( Log(), Tools::kHtmlLink );

}


////////////////////////////////////////////////////////////////////////////////
/// Evaluate Variable Importance.
///
/// Dispatches to the importance algorithm selected by `vitype`:
///  - VIType::kShort  -> EvaluateImportanceShort
///  - VIType::kAll    -> EvaluateImportanceAll
///  - VIType::kRandom -> EvaluateImportanceRandom with 2^nvars seeds; this mode
///    is only run when the dataset has more than 10 variables.
///
/// Side effects: sets fModelPersistence to kFALSE and fSilentFile to kTRUE.
/// Neither member is restored before returning.
///
/// \param[in] loader      data loader whose DataSetInfo supplies the variables
/// \param[in] vitype      importance algorithm to run
/// \param[in] theMethod   method type forwarded to the selected algorithm
/// \param[in] methodTitle method title forwarded to the selected algorithm
/// \param[in] theOption   option string forwarded to the selected algorithm
/// \return the histogram returned by the selected algorithm, or nullptr when
///         no algorithm was run (an error is printed on std::cerr).

TH1F* TMVA::Factory::EvaluateImportance(DataLoader *loader,VIType vitype, Types::EMVA theMethod,  TString methodTitle, const char *theOption)
{
  fModelPersistence=kFALSE;
  fSilentFile=kTRUE;//we need silent file here because we need fast classification results

  //getting number of variables and variable names from loader
  const int nbits = loader->GetDataSetInfo().GetNVariables();

  if (vitype == VIType::kShort) {
    return EvaluateImportanceShort(loader, theMethod, methodTitle, theOption);
  }
  if (vitype == VIType::kAll) {
    return EvaluateImportanceAll(loader, theMethod, methodTitle, theOption);
  }
  if (vitype == VIType::kRandom && nbits > 10) {
    // Number of seeds is 2^nbits. Compute it with integer arithmetic and
    // saturate instead of narrowing an out-of-range double to unsigned int.
    const unsigned int nseeds = (nbits < 32) ? (1u << nbits) : ~0u;
    return EvaluateImportanceRandom(loader, nseeds, theMethod, methodTitle, theOption);
  }

  std::cerr<<"Error in Variable Importance: Random mode requires more than 10 variables in the dataset."<<std::endl;
  return nullptr;
}


////////////////////////////////////////////////////////////////////////////////
/// Evaluate variable importance from every non-empty subset of the variables.
///
/// A subset is encoded as a bit mask `x`: bit `k` set means variable `k` is
/// used. For every mask in [1, 2^nvars) a dedicated DataLoader is created, the
/// method is booked, trained, tested and evaluated, and the resulting ROC
/// integral is stored in a table indexed by the mask (2^nvars entries). The
/// importance of variable `k` is then the sum, over all masks containing `k`,
/// of ROC(x) - ROC(x without k); the empty subset counts as ROC = 0.5.
///
/// All booked methods and the contents of fMethodsMap are discarded after each
/// subset has been evaluated.
///
/// \param[in] loader      loader describing the full dataset and variable list
/// \param[in] theMethod   method type booked for every subset
/// \param[in] methodTitle title used to book the method and to read its ROC integral
/// \param[in] theOption   option string forwarded to BookMethod
/// \return histogram built by GetImportance from the accumulated importances

TH1F* TMVA::Factory::EvaluateImportanceAll(DataLoader *loader, Types::EMVA theMethod,  TString methodTitle, const char *theOption)
{
  //getting number of variables and variable names from loader
  const int nbits = loader->GetDataSetInfo().GetNVariables();
  std::vector<TString> varNames = loader->GetDataSetInfo().GetListOfVariables();

  const uint64_t range = pow(2, nbits);

  //vector to save importances (zero initialised)
  std::vector<Double_t> importances(nbits, 0.0);
  //vector to save ROC, indexed by the subset bit mask
  std::vector<Double_t> ROC(range);
  ROC[0]=0.5;

  //the loop starts at 1 because the data loader needs at least one variable
  for (uint64_t x = 1; x < range; x++) {

    std::bitset<VIBITS>  xbitset(x);
    const std::string seedName = xbitset.to_string();

    //creating loader for seed
    TMVA::DataLoader *seedloader = new TMVA::DataLoader(seedName);

    //adding variables from seed
    for (int index = 0; index < nbits; index++) {
      if (xbitset[index]) seedloader->AddVariable(varNames[index], 'F');
    }

    DataLoaderCopy(seedloader,loader);
    seedloader->PrepareTrainingAndTestTree(loader->GetDataSetInfo().GetCut("Signal"), loader->GetDataSetInfo().GetCut("Background"), loader->GetDataSetInfo().GetSplitOptions());

    //Booking Seed
    BookMethod(seedloader, theMethod, methodTitle, theOption);

    //Train/Test/Evaluation
    TrainAllMethods();
    TestAllMethods();
    EvaluateAllMethods();

    //getting ROC
    ROC[x] = GetROCIntegral(seedName, methodTitle);

    //cleaning information to process sub-seeds
    //removing global result because it is requiring a lot of RAM for all seeds
    TMVA::MethodBase *smethod=dynamic_cast<TMVA::MethodBase*>(fMethodsMap[seedName.c_str()][0][0]);
    TMVA::ResultsClassification  *sresults = (TMVA::ResultsClassification*)smethod->Data()->GetResults(smethod->GetMethodName(), Types::kTesting, Types::kClassification);
    delete sresults;
    delete seedloader;
    this->DeleteAllMethods();

    fMethodsMap.clear();
  }

  for (uint64_t x = 0; x < range; x++) {
    const Double_t SROC = ROC[x]; //ROC of the seed
    for (uint32_t i = 0; i < VIBITS; ++i) {
      // 64-bit unsigned mask: a plain `1 << i` is a signed int and corrupts
      // the upper half of the 64-bit seed when i == 31.
      const uint64_t bit = uint64_t(1) << i;
      if (!(x & bit)) continue;

      //sub-seed: the seed without variable i; i is also the importance index
      const uint64_t y = x & ~bit;

      //need at least one variable
      //NOTE: if sub-seed is zero then is the special case
      //that count in xbitset is 1
      if (y == 0) {
        importances[i] = SROC - 0.5;
        continue;
      }

      //ROC of the sub-seed was already computed in the first loop
      importances[i] += SROC - ROC[y];
    }
  }

  std::cout<<"--- Variable Importance Results (All)"<<std::endl;
  return GetImportance(nbits,importances,varNames);
}


/// Return 2^0 + 2^1 + ... + 2^(i-1), i.e. the value whose `i` lowest bits are set.
///
/// The result is built with integer operations only, so it is exact for every
/// representable value (accumulating `pow(2, n)` through double loses the low
/// bit once the sum needs more than 53 bits). Returns 0 for i <= 0 and
/// saturates at the largest `long int` when `i` is not smaller than the number
/// of value bits of `long int`.
static long int sum(long int i)
{
  const unsigned long maxValue = ~0UL >> 1; // largest value a long int can hold
  unsigned long mask = 0;
  // append one set bit per iteration; stop early once every value bit is set
  for (long int n = 0; n < i && mask < maxValue; ++n) mask = (mask << 1) | 1UL;
  return static_cast<long int>(mask);
}


////////////////////////////////////////////////////////////////////////////////
/// Evaluate variable importance from the full variable set and the subsets
/// obtained by removing exactly one variable.
///
/// The seed is the bit mask with the `nvars` lowest bits set (all variables).
/// The method is booked, trained, tested and evaluated once on the seed, then
/// once for every sub-seed that lacks a single variable `k`; the importance of
/// `k` is ROC(seed) - ROC(seed without k). With a single variable the sub-seed
/// is empty and the importance is ROC(seed) - 0.5.
///
/// All booked methods and the contents of fMethodsMap are discarded after each
/// evaluation.
///
/// \param[in] loader      loader describing the full dataset and variable list
/// \param[in] theMethod   method type booked for every (sub-)seed
/// \param[in] methodTitle title used to book the method and to read its ROC integral
/// \param[in] theOption   option string forwarded to BookMethod
/// \return histogram built by GetImportance from the computed importances

TH1F* TMVA::Factory::EvaluateImportanceShort(DataLoader *loader, Types::EMVA theMethod,  TString methodTitle, const char *theOption)
{
  //getting number of variables and variable names from loader
  const int nbits = loader->GetDataSetInfo().GetNVariables();
  std::vector<TString> varNames = loader->GetDataSetInfo().GetListOfVariables();

  //seed with every variable enabled
  const uint64_t x = sum(nbits);

  //vector to save importances (zero initialised)
  std::vector<Double_t> importances(nbits, 0.0);

  std::bitset<VIBITS>  xbitset(x);
  const std::string seedName = xbitset.to_string();
  //data loader need at least one variable; Endl is required to actually emit the message
  if (x == 0) Log()<<kFATAL<<"Error: need at least one variable."<<Endl;

  //creating loader for seed
  TMVA::DataLoader *seedloader = new TMVA::DataLoader(seedName);

  //adding variables from seed
  for (int index = 0; index < nbits; index++) {
    if (xbitset[index]) seedloader->AddVariable(varNames[index], 'F');
  }

  //Loading Dataset
  DataLoaderCopy(seedloader,loader);

  //Booking Seed
  BookMethod(seedloader, theMethod, methodTitle, theOption);

  //Train/Test/Evaluation
  TrainAllMethods();
  TestAllMethods();
  EvaluateAllMethods();

  //getting ROC
  const Double_t SROC = GetROCIntegral(seedName, methodTitle);

  //cleaning information to process sub-seeds
  //removing global result because it is requiring a lot of RAM for all seeds
  TMVA::MethodBase *smethod=dynamic_cast<TMVA::MethodBase*>(fMethodsMap[seedName.c_str()][0][0]);
  TMVA::ResultsClassification  *sresults = (TMVA::ResultsClassification*)smethod->Data()->GetResults(smethod->GetMethodName(), Types::kTesting, Types::kClassification);
  delete sresults;
  delete seedloader;
  this->DeleteAllMethods();
  fMethodsMap.clear();

  for (uint32_t i = 0; i < VIBITS; ++i) {
    // 64-bit unsigned mask: a plain `1 << i` is a signed int and corrupts
    // the upper half of the 64-bit seed when i == 31.
    const uint64_t bit = uint64_t(1) << i;
    if (!(x & bit)) continue;

    //sub-seed: the seed without variable i; i is also the importance index
    const uint64_t y = x & ~bit;
    std::bitset<VIBITS>  ybitset(y);
    const std::string subSeedName = ybitset.to_string();

    //need at least one variable
    //NOTE: if sub-seed is zero then is the special case
    //that count in xbitset is 1
    if (y == 0) {
      importances[i] = SROC - 0.5;
      continue;
    }

    //creating loader for sub-seed
    TMVA::DataLoader *subseedloader = new TMVA::DataLoader(subSeedName);
    //adding variables from sub-seed
    for (int index = 0; index < nbits; index++) {
      if (ybitset[index]) subseedloader->AddVariable(varNames[index], 'F');
    }

    //Loading Dataset
    DataLoaderCopy(subseedloader,loader);

    //Booking SubSeed
    BookMethod(subseedloader, theMethod, methodTitle, theOption);

    //Train/Test/Evaluation
    TrainAllMethods();
    TestAllMethods();
    EvaluateAllMethods();

    //getting ROC
    const Double_t SSROC = GetROCIntegral(subSeedName, methodTitle);
    importances[i] += SROC - SSROC;

    //cleaning information
    TMVA::MethodBase *ssmethod=dynamic_cast<TMVA::MethodBase*>(fMethodsMap[subSeedName.c_str()][0][0]);
    TMVA::ResultsClassification *ssresults = (TMVA::ResultsClassification*)ssmethod->Data()->GetResults(ssmethod->GetMethodName(), Types::kTesting, Types::kClassification);
    delete ssresults;
    delete subseedloader;
    this->DeleteAllMethods();
    fMethodsMap.clear();
  }

  std::cout<<"--- Variable Importance Results (Short)"<<std::endl;
  return GetImportance(nbits,importances,varNames);
}


////////////////////////////////////////////////////////////////////////////////
/// Evaluate variable importance from randomly drawn variable subsets.
///
/// For each of the `nseeds` iterations a subset bit mask `x` is drawn with
/// TRandom3::Integer from [0, 2^nvars); an empty mask is skipped. The method is
/// booked, trained, tested and evaluated on the seed and then on every
/// sub-seed that lacks one of the seed's variables `k`; ROC(seed) -
/// ROC(sub-seed) is added to the importance of `k`.
///
/// All booked methods and the contents of fMethodsMap are discarded after each
/// evaluation. Subset masks are handled as 32-bit bitsets.
///
/// \param[in] loader      loader describing the full dataset and variable list
/// \param[in] nseeds      number of random seeds to draw
/// \param[in] theMethod   method type booked for every (sub-)seed
/// \param[in] methodTitle title used to book the method and to read its ROC integral
/// \param[in] theOption   option string forwarded to BookMethod
/// \return histogram built by GetImportance from the accumulated importances

TH1F* TMVA::Factory::EvaluateImportanceRandom(DataLoader *loader, UInt_t nseeds, Types::EMVA theMethod,  TString methodTitle, const char *theOption)
{
   TRandom3 rangen(0);  //Random Gen. (automatic storage, released on return)

   //getting number of variables and variable names from loader
   const int nbits = loader->GetDataSetInfo().GetNVariables();
   std::vector<TString> varNames = loader->GetDataSetInfo().GetListOfVariables();

   const long int range = pow(2, nbits);

   //vector to save importances (zero initialised)
   std::vector<Double_t> importances(nbits, 0.0);

   for (UInt_t n = 0; n < nseeds; n++) {
      const uint64_t x = rangen.Integer(range);

      std::bitset<32>  xbitset(x);
      if (x == 0) continue; //data loader need at least one variable
      const std::string seedName = xbitset.to_string();

      //creating loader for seed
      TMVA::DataLoader *seedloader = new TMVA::DataLoader(seedName);

      //adding variables from seed
      for (int index = 0; index < nbits; index++) {
         if (xbitset[index]) seedloader->AddVariable(varNames[index], 'F');
      }

      //Loading Dataset
      DataLoaderCopy(seedloader,loader);

      //Booking Seed
      BookMethod(seedloader, theMethod, methodTitle, theOption);

      //Train/Test/Evaluation
      TrainAllMethods();
      TestAllMethods();
      EvaluateAllMethods();

      //getting ROC
      const Double_t SROC = GetROCIntegral(seedName, methodTitle);

      //cleaning information to process sub-seeds
      //removing global result because it is requiring a lot of RAM for all seeds
      TMVA::MethodBase *smethod=dynamic_cast<TMVA::MethodBase*>(fMethodsMap[seedName.c_str()][0][0]);
      TMVA::ResultsClassification  *sresults = (TMVA::ResultsClassification*)smethod->Data()->GetResults(smethod->GetMethodName(), Types::kTesting, Types::kClassification);
      delete sresults;
      delete seedloader;
      this->DeleteAllMethods();
      fMethodsMap.clear();

      for (uint32_t i = 0; i < 32; ++i) {
         // 64-bit unsigned mask: a plain `1 << i` is a signed int and corrupts
         // the upper half of the 64-bit seed when i == 31.
         const uint64_t bit = uint64_t(1) << i;
         if (!(x & bit)) continue;

         //sub-seed: the seed without variable i; i is also the importance index
         const uint64_t y = x & ~bit;
         std::bitset<32>  ybitset(y);
         const std::string subSeedName = ybitset.to_string();

         //need at least one variable
         //NOTE: if sub-seed is zero then is the special case
         //that count in xbitset is 1
         if (y == 0) {
            // NOTE(review): this assigns rather than accumulates, so it replaces
            // whatever earlier seeds contributed to variable i - confirm intent.
            importances[i] = SROC - 0.5;
            continue;
         }

         //creating loader for sub-seed
         TMVA::DataLoader *subseedloader = new TMVA::DataLoader(subSeedName);
         //adding variables from sub-seed
         for (int index = 0; index < nbits; index++) {
            if (ybitset[index]) subseedloader->AddVariable(varNames[index], 'F');
         }

         //Loading Dataset
         DataLoaderCopy(subseedloader,loader);

         //Booking SubSeed
         BookMethod(subseedloader, theMethod, methodTitle, theOption);

         //Train/Test/Evaluation
         TrainAllMethods();
         TestAllMethods();
         EvaluateAllMethods();

         //getting ROC
         const Double_t SSROC = GetROCIntegral(subSeedName, methodTitle);
         importances[i] += SROC - SSROC;

         //cleaning information
         TMVA::MethodBase *ssmethod=dynamic_cast<TMVA::MethodBase*>(fMethodsMap[subSeedName.c_str()][0][0]);
         TMVA::ResultsClassification *ssresults = (TMVA::ResultsClassification*)ssmethod->Data()->GetResults(ssmethod->GetMethodName(), Types::kTesting, Types::kClassification);
         delete ssresults;
         delete subseedloader;
         this->DeleteAllMethods();
         fMethodsMap.clear();
      }
   }

   std::cout<<"--- Variable Importance Results (Random)"<<std::endl;
   return GetImportance(nbits,importances,varNames);
}


////////////////////////////////////////////////////////////////////////////////
/// Build the variable-importance histogram.
///
/// Each importance is expressed as a percentage of the sum of all importances,
/// printed on std::cout and stored in one labelled bin per variable. If the
/// sum is exactly zero every variable is reported as 0 % instead of dividing
/// by zero.
///
/// Side effects: changes the global gStyle (stat box option and X title offset).
///
/// \param[in] nbits       number of variables, i.e. number of histogram bins
/// \param[in] importances importance per variable; the first `nbits` entries are read
/// \param[in] varNames    variable names used as bin labels; the first `nbits` entries are read
/// \return newly allocated histogram named "vih1", detached from any directory
///         via SetDirectory(0)

TH1F* TMVA::Factory::GetImportance(const int nbits,std::vector<Double_t> importances,std::vector<TString> varNames)
{
  TH1F *vih1  = new TH1F("vih1", "", nbits, 0, nbits);

  gStyle->SetOptStat(0);

  //sum of all importances, used to express each one as a percentage
  Float_t normalization = 0.0;
  for (int i = 0; i < nbits; i++) {
    normalization += importances[i];
  }

  //only the last offset set takes effect, so a single call is enough
  gStyle->SetTitleXOffset(1.2);

  //histogram bins are numbered from 1, the vectors from 0
  for (Int_t bin = 1; bin <= nbits; bin++) {
    const Int_t ivar = bin - 1;
    Float_t roc = 0.0;
    if (normalization != 0.0) {
      roc = 100.0 * importances[ivar] / normalization;
    }
    std::cout<<"--- "<<varNames[ivar]<<" = "<<roc<<" %"<<std::endl;
    vih1->GetXaxis()->SetBinLabel(bin, varNames[ivar].Data());
    vih1->SetBinContent(bin, roc);
  }

  vih1->LabelsOption("v >", "X");
  vih1->SetBarWidth(0.97);
  Int_t ca = TColor::GetColor("#006600");
  vih1->SetFillColor(ca);
  //Int_t ci = TColor::GetColor("#990000");

  vih1->GetYaxis()->SetTitle("Importance (%)");
  vih1->GetYaxis()->SetTitleSize(0.045);
  vih1->GetYaxis()->CenterTitle();
  vih1->GetYaxis()->SetTitleOffset(1.24);

  vih1->GetYaxis()->SetRangeUser(-7, 50);
  vih1->SetDirectory(0);

//   vih1->Draw("B");
  return vih1;
}

ClassifierFactory.h

Config.h

Configurable.h

DataInputHandler.h

DataLoader.h

DataSetInfo.h

DataSetManager.h

DataSet.h

IMethod.h

MethodBase.h

MethodBoost.h

MethodCategory.h

MsgLogger.h

ROCCalc.h

ROCCurve.h

h
#define h(i)
Definition: RSha256.hxx:106

Ranking.h

ResultsClassification.h

ResultsMulticlass.h

ResultsRegression.h

Results.h

Int_t
int Int_t
Definition: RtypesCore.h:41

UInt_t
unsigned int UInt_t
Definition: RtypesCore.h:42

kFALSE
const Bool_t kFALSE
Definition: RtypesCore.h:88

Bool_t
bool Bool_t
Definition: RtypesCore.h:59

Double_t
double Double_t
Definition: RtypesCore.h:55

Float_t
float Float_t
Definition: RtypesCore.h:53

kTRUE
const Bool_t kTRUE
Definition: RtypesCore.h:87

ClassImp
#define ClassImp(name)
Definition: Rtypes.h:365

TCanvas.h

TEventList.h

TFile.h

name
char name[80]
Definition: TGX11.cxx:109

type
int type
Definition: TGX11.cxx:120

TGraph.h

TH2.h

TLeaf.h

TLegend.h

TMath.h

pow
double pow(double, double)

log
double log(double)

TMatrixDSym.h

TMatrixD
TMatrixT< Double_t > TMatrixD
Definition: TMatrixDfwd.h:22

TMatrixF.h

TMultiGraph.h

TObjString.h

TPaletteAxis.h

TPrincipal.h

TROOT.h

gROOT
#define gROOT
Definition: TROOT.h:415

Form
char * Form(const char *fmt,...)

TStyle.h

gStyle
R__EXTERN TStyle * gStyle
Definition: TStyle.h:407

TSystem.h

gSystem
R__EXTERN TSystem * gSystem
Definition: TSystem.h:560

TText.h

TTree.h

Tools.h

VariableInfo.h

VariableTransform.h

TAttAxis::SetTitleOffset
virtual void SetTitleOffset(Float_t offset=1)
Set distance between the axis and the axis title.
Definition: TAttAxis.cxx:294

TAttAxis::SetTitleSize
virtual void SetTitleSize(Float_t size=0.04)
Set size of axis title.
Definition: TAttAxis.cxx:304

TAttFill::SetFillColor
virtual void SetFillColor(Color_t fcolor)
Set the fill area color.
Definition: TAttFill.h:37

TAxis::SetBinLabel
virtual void SetBinLabel(Int_t bin, const char *label)
Set label for bin.
Definition: TAxis.cxx:809

TAxis::CenterTitle
void CenterTitle(Bool_t center=kTRUE)
Center axis title.
Definition: TAxis.h:184

TAxis::SetRangeUser
virtual void SetRangeUser(Double_t ufirst, Double_t ulast)
Set the viewing range for the axis from ufirst to ulast (in user coordinates).
Definition: TAxis.cxx:928

TCanvas
The Canvas class.
Definition: TCanvas.h:31

TColor::GetColor
static Int_t GetColor(const char *hexcolor)
Static method returning color number for color specified by hex color string of form: "#rrggbb",...
Definition: TColor.cxx:1764

TFile
A ROOT file is a suite of consecutive data records (TKey instances) with a well defined format.
Definition: TFile.h:48

TGraph
A Graph is a graphics object made of two arrays X and Y with npoints each.
Definition: TGraph.h:41

TGraph::SetTitle
virtual void SetTitle(const char *title="")
Change (i.e. set) the title.
Definition: TGraph.cxx:2312

TH1F
1-D histogram with a float per channel (see TH1 documentation)
Definition: TH1.h:571

TH1::SetDirectory
virtual void SetDirectory(TDirectory *dir)
By default when an histogram is created, it is added to the list of histogram objects in the current ...
Definition: TH1.cxx:8381

TH1::SetTitle
virtual void SetTitle(const char *title)
See GetStatOverflows for more information.
Definition: TH1.cxx:6333

TH1::LabelsOption
virtual void LabelsOption(Option_t *option="h", Option_t *axis="X")
Set option(s) to draw axis with labels.
Definition: TH1.cxx:5214

TH1::AddDirectory
static void AddDirectory(Bool_t add=kTRUE)
Sets the flag controlling the automatic add of histograms in memory.
Definition: TH1.cxx:1226

TH1::GetXaxis
TAxis * GetXaxis()
Get the behaviour adopted by the object about the statoverflows. See EStatOverflows for more informat...
Definition: TH1.h:316

TH1::GetYaxis
TAxis * GetYaxis()
Definition: TH1.h:317

TH1::SetBarWidth
virtual void SetBarWidth(Float_t width=0.5)
Definition: TH1.h:356

TH1::SetBinContent
virtual void SetBinContent(Int_t bin, Double_t content)
Set bin content see convention for numbering bins in TH1::GetBin In case the bin number is greater th...
Definition: TH1.cxx:8666

TH2
Service class for 2-Dim histogram classes.
Definition: TH2.h:30

TMVA::ClassifierFactory::Create
IMethod * Create(const std::string &name, const TString &job, const TString &title, DataSetInfo &dsi, const TString &option)
creates the method if needed based on the method name using the creator function the factory has stor...
Definition: ClassifierFactory.cxx:89

TMVA::ClassifierFactory::Instance
static ClassifierFactory & Instance()
access to the ClassifierFactory singleton creates the instance if needed
Definition: ClassifierFactory.cxx:48

TMVA::Config::IONames::fWeightFileDir
TString fWeightFileDir
Definition: Config.h:124

TMVA::Config::IONames::fWeightFileDirPrefix
TString fWeightFileDirPrefix
Definition: Config.h:123

TMVA::Config::VariablePlotting::fNbinsXOfROCCurve
Int_t fNbinsXOfROCCurve
Definition: Config.h:113

TMVA::Config::SetDrawProgressBar
void SetDrawProgressBar(Bool_t d)
Definition: Config.h:71

TMVA::Config::SetUseColor
void SetUseColor(Bool_t uc)
Definition: Config.h:62

TMVA::Config::fVariablePlotting
class TMVA::Config::VariablePlotting fVariablePlotting

TMVA::Config::SetSilent
void SetSilent(Bool_t s)
Definition: Config.h:65

TMVA::Config::GetIONames
IONames & GetIONames()
Definition: Config.h:100

TMVA::Configurable
Definition: Configurable.h:45

TMVA::Configurable::SetConfigDescription
void SetConfigDescription(const char *d)
Definition: Configurable.h:64

TMVA::Configurable::DeclareOptionRef
OptionBase * DeclareOptionRef(T &ref, const TString &name, const TString &desc="")

TMVA::Configurable::AddPreDefVal
void AddPreDefVal(const T &)
Definition: Configurable.h:168

TMVA::Configurable::SetConfigName
void SetConfigName(const char *n)
Definition: Configurable.h:63

TMVA::Configurable::ParseOptions
virtual void ParseOptions()
options parser
Definition: Configurable.cxx:128

TMVA::Configurable::GetOptions
const TString & GetOptions() const
Definition: Configurable.h:84

TMVA::Configurable::Log
MsgLogger & Log() const
Definition: Configurable.h:122

TMVA::Configurable::fLogger
MsgLogger * fLogger
Definition: Configurable.h:128

TMVA::Configurable::CheckForUnusedOptions
void CheckForUnusedOptions() const
checks for unused options in option string
Definition: Configurable.cxx:274

TMVA::DataInputHandler::GetEntries
UInt_t GetEntries(const TString &name) const
Definition: DataInputHandler.h:101

TMVA::DataLoader
Definition: DataLoader.h:52

TMVA::DataLoader::PrepareTrainingAndTestTree
void PrepareTrainingAndTestTree(const TCut &cut, const TString &splitOpt)
prepare the training and test trees -> same cuts for signal and background
Definition: DataLoader.cxx:617

TMVA::DataLoader::GetDataSetInfo
DataSetInfo & GetDataSetInfo()
Definition: DataLoader.cxx:123

TMVA::DataLoader::AddVariable
void AddVariable(const TString &expression, const TString &title, const TString &unit, char type='F', Double_t min=0, Double_t max=0)
user inserts discriminating variable in data set info
Definition: DataLoader.cxx:470

TMVA::DataSetInfo
Class that contains all the data information.
Definition: DataSetInfo.h:60

TMVA::DataSetInfo::GetNVariables
UInt_t GetNVariables() const
Definition: DataSetInfo.h:125

TMVA::DataSetInfo::GetName
virtual const char * GetName() const
Returns name of object.
Definition: DataSetInfo.h:69

TMVA::DataSetInfo::CorrelationMatrix
const TMatrixD * CorrelationMatrix(const TString &className) const
Definition: DataSetInfo.cxx:203

TMVA::DataSetInfo::GetNClasses
UInt_t GetNClasses() const
Definition: DataSetInfo.h:153

TMVA::DataSetInfo::GetSplitOptions
const TString & GetSplitOptions() const
Definition: DataSetInfo.h:184

TMVA::DataSetInfo::GetNTargets
UInt_t GetNTargets() const
Definition: DataSetInfo.h:126

TMVA::DataSetInfo::GetDataSet
DataSet * GetDataSet() const
returns data set
Definition: DataSetInfo.cxx:486

TMVA::DataSetInfo::CreateCorrelationMatrixHist
TH2 * CreateCorrelationMatrixHist(const TMatrixD *m, const TString &hName, const TString &hTitle) const
Definition: DataSetInfo.cxx:422

TMVA::DataSetInfo::GetListOfVariables
std::vector< TString > GetListOfVariables() const
returns list of variables
Definition: DataSetInfo.cxx:399

TMVA::DataSetInfo::GetClassInfo
ClassInfo * GetClassInfo(Int_t clNum) const
Definition: DataSetInfo.cxx:152

TMVA::DataSetInfo::GetCut
const TCut & GetCut(Int_t i) const
Definition: DataSetInfo.h:166

TMVA::DataSetInfo::GetVariableInfo
VariableInfo & GetVariableInfo(Int_t i)
Definition: DataSetInfo.h:103

TMVA::DataSetInfo::IsSignal
Bool_t IsSignal(const Event *ev) const
Definition: DataSetInfo.cxx:173

TMVA::DataSetInfo::GetDataSetManager
DataSetManager * GetDataSetManager()
Definition: DataSetInfo.h:192

TMVA::DataSetManager::DataInput
DataInputHandler & DataInput()
Definition: DataSetManager.h:76

TMVA::DataSet
Class that contains all the data information.
Definition: DataSet.h:69

TMVA::DataSet::GetNEvtSigTest
Long64_t GetNEvtSigTest()
return number of signal test events in dataset
Definition: DataSet.cxx:427

TMVA::DataSet::GetTree
TTree * GetTree(Types::ETreeType type)
create the test/trainings tree with all the variables, the weights, the classes, the targets,...
Definition: DataSet.cxx:609

TMVA::DataSet::GetEvent
const Event * GetEvent() const
Definition: DataSet.cxx:202

TMVA::DataSet::GetNEvents
Long64_t GetNEvents(Types::ETreeType type=Types::kMaxTreeType) const
Definition: DataSet.h:217

TMVA::DataSet::GetResults
Results * GetResults(const TString &, Types::ETreeType type, Types::EAnalysisType analysistype)
Definition: DataSet.cxx:265

TMVA::DataSet::GetNTrainingEvents
Long64_t GetNTrainingEvents() const
Definition: DataSet.h:79

TMVA::DataSet::SetCurrentType
void SetCurrentType(Types::ETreeType type) const
Definition: DataSet.h:100

TMVA::DataSet::GetEventCollection
const std::vector< Event * > & GetEventCollection(Types::ETreeType type=Types::kMaxTreeType) const
Definition: DataSet.h:227

TMVA::DataSet::GetNEvtBkgdTest
Long64_t GetNEvtBkgdTest()
return number of background test events in dataset
Definition: DataSet.cxx:435

TMVA::Event
Definition: Event.h:51

TMVA::Event::GetValue
Float_t GetValue(UInt_t ivar) const
return value of i'th variable
Definition: Event.cxx:237

TMVA::Event::SetIsTraining
static void SetIsTraining(Bool_t)
when this static function is called, it sets the flag whether events with negative event weight shoul...
Definition: Event.cxx:392

TMVA::Factory
This is the main MVA steering class.
Definition: Factory.h:81

TMVA::Factory::PrintHelpMessage
void PrintHelpMessage(const TString &datasetname, const TString &methodTitle="") const
Print predefined help message of classifier.
Definition: Factory.cxx:1308

TMVA::Factory::GetROCIntegral
Double_t GetROCIntegral(DataLoader *loader, TString theMethodName, UInt_t iClass=0)
Calculate the integral of the ROC curve, also known as the area under curve (AUC),...
Definition: Factory.cxx:843

TMVA::Factory::fCorrelations
Bool_t fCorrelations
enable to calculate correlations
Definition: Factory.h:212

TMVA::Factory::MVector
std::vector< IMethod * > MVector
Definition: Factory.h:85

TMVA::Factory::TrainAllMethods
void TrainAllMethods()
Iterates through all booked methods and calls training.
Definition: Factory.cxx:1094

TMVA::Factory::Verbose
Bool_t Verbose(void) const
Definition: Factory.h:135

TMVA::Factory::WriteDataInformation
void WriteDataInformation(DataSetInfo &fDataSetInfo)
Definition: Factory.cxx:597

TMVA::Factory::BookMethod
MethodBase * BookMethod(DataLoader *loader, TString theMethodName, TString methodTitle, TString theOption="")
Book a classifier or regression method.
Definition: Factory.cxx:346

TMVA::Factory::Factory
Factory(TString theJobName, TFile *theTargetFile, TString theOption="")
Standard constructor.
Definition: Factory.cxx:119

TMVA::Factory::TestAllMethods
void TestAllMethods()
Evaluates all booked methods on the testing data and adds the output to the Results in the corresponi...
Definition: Factory.cxx:1245

TMVA::Factory::fVerbose
Bool_t fVerbose
verbose mode
Definition: Factory.h:210

TMVA::Factory::EvaluateAllMethods
void EvaluateAllMethods(void)
Iterates over all MVAs that have been booked, and calls their evaluation methods.
Definition: Factory.cxx:1350

TMVA::Factory::EvaluateImportanceRandom
TH1F * EvaluateImportanceRandom(DataLoader *loader, UInt_t nseeds, Types::EMVA theMethod, TString methodTitle, const char *theOption="")
Definition: Factory.cxx:2390

TMVA::Factory::GetImportance
TH1F * GetImportance(const int nbits, std::vector< Double_t > importances, std::vector< TString > varNames)
Definition: Factory.cxx:2502

TMVA::Factory::fROC
Bool_t fROC
enable to calculate ROC values
Definition: Factory.h:213

TMVA::Factory::EvaluateAllVariables
void EvaluateAllVariables(DataLoader *loader, TString options="")
Iterates over all MVA input variables and evaluates them.
Definition: Factory.cxx:1335

TMVA::Factory::fVerboseLevel
TString fVerboseLevel
verbosity level, controls granularity of logging
Definition: Factory.h:211

TMVA::Factory::EvaluateImportance
TH1F * EvaluateImportance(DataLoader *loader, VIType vitype, Types::EMVA theMethod, TString methodTitle, const char *theOption="")
Evaluate Variable Importance.
Definition: Factory.cxx:2166

TMVA::Factory::~Factory
virtual ~Factory()
Destructor.
Definition: Factory.cxx:300

TMVA::Factory::GetROCCurve
TGraph * GetROCCurve(DataLoader *loader, TString theMethodName, Bool_t setTitles=kTRUE, UInt_t iClass=0)
Argument iClass specifies the class to generate the ROC curve in a multiclass setting.
Definition: Factory.cxx:904

TMVA::Factory::MakeClass
virtual void MakeClass(const TString &datasetname, const TString &methodTitle="") const
Definition: Factory.cxx:1280

TMVA::Factory::BookMethodWeightfile
MethodBase * BookMethodWeightfile(DataLoader *dataloader, TMVA::Types::EMVA methodType, const TString &weightfile)
Adds an already constructed method to be managed by this factory.
Definition: Factory.cxx:498

TMVA::Factory::fModelPersistence
Bool_t fModelPersistence
option to save the trained model in xml file or using serialization
Definition: Factory.h:219

TMVA::Factory::OptimizeAllMethods
std::map< TString, Double_t > OptimizeAllMethods(TString fomType="ROCIntegral", TString fitType="FitGA")
Iterates through all booked methods and, for those that use parameter tuning, runs the tuning and keeps the optimal parameter setting.
Definition: Factory.cxx:695

TMVA::Factory::GetROC
ROCCurve * GetROC(DataLoader *loader, TString theMethodName, UInt_t iClass=0, Types::ETreeType type=Types::kTesting)
Private method to generate a ROCCurve instance for a given method.
Definition: Factory.cxx:744

TMVA::Factory::EvaluateImportanceShort
TH1F * EvaluateImportanceShort(DataLoader *loader, Types::EMVA theMethod, TString methodTitle, const char *theOption="")
Definition: Factory.cxx:2285

TMVA::Factory::fAnalysisType
Types::EAnalysisType fAnalysisType
the training type
Definition: Factory.h:218

TMVA::Factory::HasMethod
Bool_t HasMethod(const TString &datasetname, const TString &title) const
Checks whether a given method name is defined for a given dataset.
Definition: Factory.cxx:580

TMVA::Factory::EvaluateImportanceAll
TH1F * EvaluateImportanceAll(DataLoader *loader, Types::EMVA theMethod, TString methodTitle, const char *theOption="")
Definition: Factory.cxx:2189

TMVA::Factory::SetVerbose
void SetVerbose(Bool_t v=kTRUE)
Definition: Factory.cxx:338

TMVA::Factory::fgTargetFile
TFile * fgTargetFile
Definition: Factory.h:202

TMVA::Factory::GetMethod
IMethod * GetMethod(const TString &datasetname, const TString &title) const
Returns pointer to MVA that corresponds to given method title.
Definition: Factory.cxx:562

TMVA::Factory::DeleteAllMethods
void DeleteAllMethods(void)
Delete methods.
Definition: Factory.cxx:318

TMVA::Factory::fTransformations
TString fTransformations
list of transformations to test
Definition: Factory.h:209

TMVA::Factory::Greetings
void Greetings()
Print welcome message.
Definition: Factory.cxx:290

TMVA::Factory::GetROCCurveAsMultiGraph
TMultiGraph * GetROCCurveAsMultiGraph(DataLoader *loader, UInt_t iClass)
Generate a collection of graphs, for all methods for a given class.
Definition: Factory.cxx:973

TMVA::IMethod
Interface for all concrete MVA method implementations.
Definition: IMethod.h:54

TMVA::IMethod::PrintHelpMessage
virtual void PrintHelpMessage() const =0

TMVA::IMethod::HasAnalysisType
virtual Bool_t HasAnalysisType(Types::EAnalysisType type, UInt_t numberClasses, UInt_t numberTargets)=0

TMVA::IMethod::MakeClass
virtual void MakeClass(const TString &classFileName=TString("")) const =0

TMVA::MethodBase
Virtual base class for all MVA methods.
Definition: MethodBase.h:111

TMVA::MethodBase::GetSeparation
virtual Double_t GetSeparation(TH1 *, TH1 *) const
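compute "separation" defined as \( \langle s^2 \rangle = \frac{1}{2} \int_{-\infty}^{+\infty} \frac{(S(x) - B(x))^2}{S(x) + B(x)} \, dx \)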
Definition: MethodBase.cxx:2780

TMVA::MethodBase::SetSilentFile
void SetSilentFile(Bool_t status)
Definition: MethodBase.h:377

TMVA::MethodBase::SetWeightFileDir
void SetWeightFileDir(TString fileDir)
set directory of weight file
Definition: MethodBase.cxx:2050

TMVA::MethodBase::TestRegression
virtual void TestRegression(Double_t &bias, Double_t &biasT, Double_t &dev, Double_t &devT, Double_t &rms, Double_t &rmsT, Double_t &mInf, Double_t &mInfT, Double_t &corr, Types::ETreeType type)
calculate <sum-of-deviation-squared> of regression output versus "true" value from test sample
Definition: MethodBase.cxx:982

TMVA::MethodBase::DeclareCompatibilityOptions
virtual void DeclareCompatibilityOptions()
options that are used ONLY for the READER to ensure backward compatibility they are hence without any...
Definition: MethodBase.cxx:601

TMVA::MethodBase::GetMethodTypeName
TString GetMethodTypeName() const
Definition: MethodBase.h:331

TMVA::MethodBase::DoMulticlass
Bool_t DoMulticlass() const
Definition: MethodBase.h:439

TMVA::MethodBase::GetSignificance
virtual Double_t GetSignificance() const
compute significance of mean difference
Definition: MethodBase.cxx:2767

TMVA::MethodBase::GetName
const char * GetName() const
Definition: MethodBase.h:333

TMVA::MethodBase::GetAnalysisType
Types::EAnalysisType GetAnalysisType() const
Definition: MethodBase.h:437

TMVA::MethodBase::GetMulticlassConfusionMatrix
virtual TMatrixD GetMulticlassConfusionMatrix(Double_t effB, Types::ETreeType type)
Construct a confusion matrix for a multiclass classifier.
Definition: MethodBase.cxx:2741

TMVA::MethodBase::PrintHelpMessage
void PrintHelpMessage() const
prints out method-specific help message
Definition: MethodBase.cxx:3259

TMVA::MethodBase::TrainMethod
void TrainMethod()
Definition: MethodBase.cxx:655

TMVA::MethodBase::WriteEvaluationHistosToFile
virtual void WriteEvaluationHistosToFile(Types::ETreeType treetype)
writes all MVA evaluation histograms to file
Definition: MethodBase.cxx:2085

TMVA::MethodBase::TestMulticlass
virtual void TestMulticlass()
test multiclass classification
Definition: MethodBase.cxx:1089

TMVA::MethodBase::SetupMethod
void SetupMethod()
setup of methods
Definition: MethodBase.cxx:411

TMVA::MethodBase::GetEfficiency
virtual Double_t GetEfficiency(const TString &, Types::ETreeType, Double_t &err)
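fill background efficiency (resp. rejection) versus signal efficiency plots and return the signal efficiency at the requested background efficiency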
Definition: MethodBase.cxx:2293

TMVA::MethodBase::SetAnalysisType
virtual void SetAnalysisType(Types::EAnalysisType type)
Definition: MethodBase.h:436

TMVA::MethodBase::GetMethodName
const TString & GetMethodName() const
Definition: MethodBase.h:330

TMVA::MethodBase::DoRegression
Bool_t DoRegression() const
Definition: MethodBase.h:438

TMVA::MethodBase::ProcessSetup
void ProcessSetup()
process all options the "CheckForUnusedOptions" is done in an independent call, since it may be overr...
Definition: MethodBase.cxx:428

TMVA::MethodBase::GetTrainingEfficiency
virtual Double_t GetTrainingEfficiency(const TString &)
Definition: MethodBase.cxx:2519

TMVA::MethodBase::DataInfo
DataSetInfo & DataInfo() const
Definition: MethodBase.h:409

TMVA::MethodBase::MakeClass
virtual void MakeClass(const TString &classFileName=TString("")) const
create reader class for method (classification only at present)
Definition: MethodBase.cxx:2998

TMVA::MethodBase::TestClassification
virtual void TestClassification()
initialization
Definition: MethodBase.cxx:1116

TMVA::MethodBase::AddOutput
void AddOutput(Types::ETreeType type, Types::EAnalysisType analysisType)
Definition: MethodBase.cxx:1306

TMVA::MethodBase::ReadStateFromFile
void ReadStateFromFile()
Function to read options and weights from file.
Definition: MethodBase.cxx:1417

TMVA::MethodBase::OptimizeTuningParameters
virtual std::map< TString, Double_t > OptimizeTuningParameters(TString fomType="ROCIntegral", TString fitType="FitGA")
call the Optimizer with the set of parameters and ranges that are meant to be tuned.
Definition: MethodBase.cxx:628

TMVA::MethodBase::fDataSetInfo
DataSetInfo & fDataSetInfo
Definition: MethodBase.h:605

TMVA::MethodBase::GetMethodType
Types::EMVA GetMethodType() const
Definition: MethodBase.h:332

TMVA::MethodBase::SetFile
void SetFile(TFile *file)
Definition: MethodBase.h:374

TMVA::MethodBase::Data
DataSet * Data() const
Definition: MethodBase.h:408

TMVA::MethodBase::SetModelPersistence
void SetModelPersistence(Bool_t status)
Definition: MethodBase.h:381

TMVA::MethodBase::GetROCIntegral
virtual Double_t GetROCIntegral(TH1D *histS, TH1D *histB) const
calculate the area (integral) under the ROC curve as an overall quality measure of the classification
Definition: MethodBase.cxx:2813

TMVA::MethodBase::CheckSetup
virtual void CheckSetup()
check may be overridden by derived class (sometimes, eg, fitters are used which can only be implement...
Definition: MethodBase.cxx:438

TMVA::MethodBoost
Class for boosting a TMVA method.
Definition: MethodBoost.h:58

TMVA::MethodBoost::SetBoostedMethodName
void SetBoostedMethodName(TString methodName)
Definition: MethodBoost.h:86

TMVA::MethodBoost::fDataSetManager
DataSetManager * fDataSetManager
Definition: MethodBoost.h:193

TMVA::MethodCategory
Class for categorizing the phase space.
Definition: MethodCategory.h:58

TMVA::MethodCategory::fDataSetManager
DataSetManager * fDataSetManager
Definition: MethodCategory.h:131

TMVA::MsgLogger
ostringstream derivative to redirect and format output
Definition: MsgLogger.h:59

TMVA::MsgLogger::SetMinType
void SetMinType(EMsgType minType)
Definition: MsgLogger.h:72

TMVA::MsgLogger::SetSource
void SetSource(const std::string &source)
Definition: MsgLogger.h:70

TMVA::MsgLogger::InhibitOutput
static void InhibitOutput()
Definition: MsgLogger.cxx:74

TMVA::ROCCurve
Definition: ROCCurve.h:47

TMVA::ROCCurve::GetEffSForEffB
Double_t GetEffSForEffB(Double_t effB, const UInt_t num_points=41)
Calculate the signal efficiency (sensitivity) for a given background efficiency (sensitivity).
Definition: ROCCurve.cxx:220

TMVA::ROCCurve::GetROCIntegral
Double_t GetROCIntegral(const UInt_t points=41)
Calculates the ROC integral (AUC)
Definition: ROCCurve.cxx:251

TMVA::ROCCurve::GetROCCurve
TGraph * GetROCCurve(const UInt_t points=100)
Returns a new TGraph containing the ROC curve.
Definition: ROCCurve.cxx:277

TMVA::Ranking
Ranking for variables in method (implementation)
Definition: Ranking.h:48

TMVA::Ranking::Print
virtual void Print() const
get maximum length of variable names
Definition: Ranking.cxx:111

TMVA::ResultsClassification
Class that is the base-class for a vector of result.
Definition: ResultsClassification.h:48

TMVA::ResultsMulticlass
Class which takes the results of a multiclass classification.
Definition: ResultsMulticlass.h:55

TMVA::Results
Class that is the base-class for a vector of result.
Definition: Results.h:57

TMVA::Tools::FormattedOutput
void FormattedOutput(const std::vector< Double_t > &, const std::vector< TString > &, const TString titleVars, const TString titleValues, MsgLogger &logger, TString format="%+1.3f")
formatted output of simple table
Definition: Tools.cxx:899

TMVA::Tools::UsefulSortDescending
void UsefulSortDescending(std::vector< std::vector< Double_t > > &, std::vector< TString > *vs=0)
sort 2D vector (AND in parallel a TString vector) in such a way that the "first vector is sorted" and...
Definition: Tools.cxx:576

TMVA::Tools::ROOTVersionMessage
void ROOTVersionMessage(MsgLogger &logger)
prints the ROOT release number and date
Definition: Tools.cxx:1337

TMVA::Tools::SplitString
std::vector< TString > SplitString(const TString &theOpt, const char separator) const
splits the option string at 'separator' and fills the list 'splitV' with the primitive strings
Definition: Tools.cxx:1211

TMVA::Tools::Color
const TString & Color(const TString &)
human readable color strings
Definition: Tools.cxx:840

TMVA::Tools::GetCorrelationMatrix
const TMatrixD * GetCorrelationMatrix(const TMatrixD *covMat)
turns covariance into correlation matrix
Definition: Tools.cxx:336

TMVA::Tools::kHtmlLink
@ kHtmlLink
Definition: Tools.h:216

TMVA::Tools::TMVACitation
void TMVACitation(MsgLogger &logger, ECitation citType=kPlainText)
kinds of TMVA citation
Definition: Tools.cxx:1453

TMVA::Tools::TMVAVersionMessage
void TMVAVersionMessage(MsgLogger &logger)
prints the TMVA release number and date
Definition: Tools.cxx:1328

TMVA::Tools::TMVAWelcomeMessage
void TMVAWelcomeMessage()
direct output, eg, when starting ROOT session -> no use of Logger here
Definition: Tools.cxx:1314

TMVA::Tools::UsefulSortAscending
void UsefulSortAscending(std::vector< std::vector< Double_t > > &, std::vector< TString > *vs=0)
sort 2D vector (AND in parallel a TString vector) in such a way that the "first vector is sorted" and...
Definition: Tools.cxx:550

TMVA::TransformationHandler
Class that contains all the data information.
Definition: TransformationHandler.h:55

TMVA::TransformationHandler::PrintVariableRanking
void PrintVariableRanking() const
prints ranking of input variables
Definition: TransformationHandler.cxx:924

TMVA::Types
Singleton class for Global types used by TMVA.
Definition: Types.h:73

TMVA::Types::Instance
static Types & Instance()
return the single instance of "Types" if it already exists, or create it (Singleton)
Definition: Types.cxx:70

TMVA::Types::EMVA
EMVA
Definition: Types.h:78

TMVA::Types::kCategory
@ kCategory
Definition: Types.h:99

TMVA::Types::kCuts
@ kCuts
Definition: Types.h:80

TMVA::Types::EAnalysisType
EAnalysisType
Definition: Types.h:127

TMVA::Types::kMulticlass
@ kMulticlass
Definition: Types.h:130

TMVA::Types::kNoAnalysisType
@ kNoAnalysisType
Definition: Types.h:131

TMVA::Types::kClassification
@ kClassification
Definition: Types.h:128

TMVA::Types::kMaxAnalysisType
@ kMaxAnalysisType
Definition: Types.h:132

TMVA::Types::kRegression
@ kRegression
Definition: Types.h:129

TMVA::Types::ETreeType
ETreeType
Definition: Types.h:143

TMVA::Types::kTraining
@ kTraining
Definition: Types.h:144

TMVA::Types::kTesting
@ kTesting
Definition: Types.h:145

TMVA::VariableInfo::GetLabel
const TString & GetLabel() const
Definition: VariableInfo.h:59

TMatrixT< Double_t >

TMultiGraph
A TMultiGraph is a collection of TGraph (or derived) objects.
Definition: TMultiGraph.h:35

TMultiGraph::GetListOfGraphs
TList * GetListOfGraphs() const
Definition: TMultiGraph.h:69

TMultiGraph::Add
virtual void Add(TGraph *graph, Option_t *chopt="")
Add a new graph to the list of graphs.
Definition: TMultiGraph.cxx:452

TMultiGraph::GetHistogram
TH1F * GetHistogram()
Returns a pointer to the histogram used to draw the axis.
Definition: TMultiGraph.cxx:1050

TMultiGraph::Draw
virtual void Draw(Option_t *chopt="")
Draw this multigraph with its current attributes.
Definition: TMultiGraph.cxx:542

TMultiGraph::GetYaxis
TAxis * GetYaxis()
Get y axis of the graph.
Definition: TMultiGraph.cxx:1132

TMultiGraph::GetXaxis
TAxis * GetXaxis()
Get x axis of the graph.
Definition: TMultiGraph.cxx:1120

TNamed::SetTitle
virtual void SetTitle(const char *title="")
Set the title of the TNamed.
Definition: TNamed.cxx:164

TNamed::fName
TString fName
Definition: TNamed.h:32

TNamed::Clone
virtual TObject * Clone(const char *newname="") const
Make a clone of an object using the Streamer facility.
Definition: TNamed.cxx:74

TNamed::GetName
virtual const char * GetName() const
Returns name of object.
Definition: TNamed.h:47

TObject::kOverwrite
@ kOverwrite
overwrite existing object with same name
Definition: TObject.h:88

TPad::BuildLegend
virtual TLegend * BuildLegend(Double_t x1=0.3, Double_t y1=0.21, Double_t x2=0.3, Double_t y2=0.21, const char *title="", Option_t *option="")
Build a legend from the graphical objects in the pad.
Definition: TPad.cxx:491

TPad::SetGrid
virtual void SetGrid(Int_t valuex=1, Int_t valuey=1)
Definition: TPad.h:330

TPrincipal
Principal Components Analysis (PCA)
Definition: TPrincipal.h:20

TPrincipal::AddRow
virtual void AddRow(const Double_t *x)
Add a data point and update the covariance matrix.
Definition: TPrincipal.cxx:410

TPrincipal::GetCovarianceMatrix
const TMatrixD * GetCovarianceMatrix() const
Definition: TPrincipal.h:58

TPrincipal::MakePrincipals
virtual void MakePrincipals()
Perform the principal components analysis.
Definition: TPrincipal.cxx:869

TRandom3
Random number generator class based on the Mersenne Twister algorithm of M. Matsumoto and T. Nishimura.
Definition: TRandom3.h:27

TString
Basic string class.
Definition: TString.h:131

TString::Length
Ssiz_t Length() const
Definition: TString.h:405

TString::ToLower
void ToLower()
Change string to lower-case.
Definition: TString.cxx:1125

TString::CompareTo
int CompareTo(const char *cs, ECaseCompare cmp=kExact) const
Compare a string to char *cs.
Definition: TString.cxx:418

TString::Data
const char * Data() const
Definition: TString.h:364

TString::ReplaceAll
TString & ReplaceAll(const TString &s1, const TString &s2)
Definition: TString.h:687

TString::BeginsWith
Bool_t BeginsWith(const char *s, ECaseCompare cmp=kExact) const
Definition: TString.h:610

TString::IsNull
Bool_t IsNull() const
Definition: TString.h:402

TString::Contains
Bool_t Contains(const char *pat, ECaseCompare cmp=kExact) const
Definition: TString.h:619

TStyle::SetOptStat
void SetOptStat(Int_t stat=1)
The type of information printed in the histogram statistics box can be selected via the parameter mod...
Definition: TStyle.cxx:1450

TStyle::SetTitleXOffset
void SetTitleXOffset(Float_t offset=1)
Definition: TStyle.h:387

TSystem::MakeDirectory
virtual int MakeDirectory(const char *name)
Make a directory.
Definition: TSystem.cxx:835

TTree::Write
virtual Int_t Write(const char *name=0, Int_t option=0, Int_t bufsize=0)
Write this object to the current directory.
Definition: TTree.cxx:9485

y
Double_t y[n]
Definition: legend1.C:17

x
Double_t x[n]
Definition: legend1.C:17

n
const Int_t n
Definition: legend1.C:16

Cppyy::GetMethodName
std::string GetMethodName(TCppMethod_t)
Definition: Cppyy.cxx:757

Cppyy::GetMethod
TCppMethod_t GetMethod(TCppScope_t scope, TCppIndex_t imeth)
Definition: Cppyy.cxx:751

ROOT::Math::detail::sep
@ sep
Definition: GenVectorIO.h:35

TGeant4Unit::s
static constexpr double s
Definition: TGeant4SystemOfUnits.h:162

TMVA::DataLoaderCopy
void DataLoaderCopy(TMVA::DataLoader *des, TMVA::DataLoader *src)

TMVA::gConfig
Config & gConfig()

TMVA::gTools
Tools & gTools()

TMVA::CreateVariableTransforms
void CreateVariableTransforms(const TString &trafoDefinition, TMVA::DataSetInfo &dataInfo, TMVA::TransformationHandler &transformationHandler, TMVA::MsgLogger &log)
Definition: VariableTransform.cxx:67

TMVA::Endl
MsgLogger & Endl(MsgLogger &ml)
Definition: MsgLogger.h:158

TMath::IsNaN
Bool_t IsNaN(Double_t x)
Definition: TMath.h:882

TMath::Log
Double_t Log(Double_t x)
Definition: TMath.h:750

graph
Definition: graph.py:1

v
@ v
Definition: rootcling_impl.cxx:3622

m
auto * m
Definition: textangle.C:8

Factory.h

Types.h

VIBITS
#define VIBITS
Definition: Factory.cxx:107

sum
static long int sum(long int i)
Definition: Factory.cxx:2276

MinNoTrainingEvents
const Int_t MinNoTrainingEvents
Definition: Factory.cxx:99

READXML
#define READXML
Definition: Factory.cxx:104