doc/hackathon/MethodPyRandomForest_8cxx_source.html

// @(#)root/tmva/pymva $Id$

// Authors: Omar Zapata, Lorenzo Moneta, Sergei Gleyzer 2015


/**********************************************************************************

 * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

 * Package: TMVA                                                                  *

 * Class  : MethodPyRandomForest                                                  *

 * Web    : http://oproject.org                                                   *

 *                                                                                *

 * Description:                                                                   *

 *      Random Forest Classifier from scikit-learn                                *

 *                                                                                *

 *                                                                                *

 * Redistribution and use in source and binary forms, with or without             *

 * modification, are permitted according to the terms listed in LICENSE           *

 * (see tmva/doc/LICENSE)                                          *

 *                                                                                *

 **********************************************************************************/

#include <Python.h>    // Needs to be included first to avoid redefinition of _POSIX_C_SOURCE

#include "TMVA/MethodPyRandomForest.h"


#define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION

#include <numpy/arrayobject.h>


#include "TMVA/Configurable.h"

#include "TMVA/ClassifierFactory.h"

#include "TMVA/Config.h"

#include "TMVA/DataSet.h"

#include "TMVA/Event.h"

#include "TMVA/IMethod.h"

#include "TMVA/MsgLogger.h"

#include "TMVA/PDF.h"

#include "TMVA/Ranking.h"

#include "TMVA/Results.h"

#include "TMVA/Tools.h"

#include "TMVA/Types.h"

#include "TMVA/Timer.h"

#include "TMVA/VariableTransformBase.h"


#include "TMatrix.h"


using namespace TMVA;


namespace TMVA {

namespace Internal {

// Scope guard around the Python GIL state API: the constructor calls
// PyGILState_Ensure() and stores the returned state, the destructor passes
// that state to PyGILState_Release().
// NOTE(review): copy construction/assignment are not deleted; a copied guard
// would hand the same state to PyGILState_Release() twice.
// NOTE(review): a class with the same qualified name appears to be defined in
// MethodPyAdaBoost.cxx as well - keep the definitions identical (TODO confirm).
class PyGILRAII {

   // State handle returned by PyGILState_Ensure() in the constructor.
   PyGILState_STATE m_GILState;


public:

   // Calls PyGILState_Ensure() and remembers the returned state.
   PyGILRAII() : m_GILState(PyGILState_Ensure()) {}

   // Gives the stored state back through PyGILState_Release().
   ~PyGILRAII() { PyGILState_Release(m_GILState); }

};

} // namespace Internal

} // namespace TMVA


REGISTER_METHOD(PyRandomForest)


//_______________________________________________________________________


// Constructor taking job name, method title, dataset info and option string.
// All four are forwarded, together with Types::kPyRandomForest, to
// PyMethodBase; every option member is set to its built-in default.
// String-typed options hold Python source text that ProcessOptions() later
// passes to Eval(), which is why the MaxFeatures default carries its own quotes.
MethodPyRandomForest::MethodPyRandomForest(const TString &jobName, const TString &methodTitle, DataSetInfo &dsi,
                                           const TString &theOption)
   : PyMethodBase(jobName, Types::kPyRandomForest, methodTitle, dsi, theOption),
     fNestimators(10),          // option "NEstimators"
     fCriterion("gini"),        // option "Criterion"
     fMaxDepth("None"),         // option "MaxDepth"
     fMinSamplesSplit(2),       // option "MinSamplesSplit"
     fMinSamplesLeaf(1),        // option "MinSamplesLeaf"
     fMinWeightFractionLeaf(0), // option "MinWeightFractionLeaf"
     fMaxFeatures("'sqrt'"),    // option "MaxFeatures"
     fMaxLeafNodes("None"),     // option "MaxLeafNodes"
     fBootstrap(kTRUE),         // option "Bootstrap"
     fOobScore(kFALSE),         // option "OoBScore"
     fNjobs(1),                 // option "NJobs"
     fRandomState("None"),      // option "RandomState"
     fVerbose(0),               // option "Verbose"
     fWarmStart(kFALSE),        // option "WarmStart"
     fClassWeight("None")       // option "ClassWeight"
{
}


//_______________________________________________________________________


// Constructor taking the dataset info and a weight-file name, both forwarded
// (with Types::kPyRandomForest) to PyMethodBase.
// NOTE(review): presumably the entry point used when a trained method is
// re-created from a weight file - confirm against the callers.
// The option members receive the same defaults as in the other constructor.
MethodPyRandomForest::MethodPyRandomForest(DataSetInfo &theData, const TString &theWeightFile)
   : PyMethodBase(Types::kPyRandomForest, theData, theWeightFile),
     fNestimators(10),          // option "NEstimators"
     fCriterion("gini"),        // option "Criterion"
     fMaxDepth("None"),         // option "MaxDepth"
     fMinSamplesSplit(2),       // option "MinSamplesSplit"
     fMinSamplesLeaf(1),        // option "MinSamplesLeaf"
     fMinWeightFractionLeaf(0), // option "MinWeightFractionLeaf"
     fMaxFeatures("'sqrt'"),    // option "MaxFeatures"
     fMaxLeafNodes("None"),     // option "MaxLeafNodes"
     fBootstrap(kTRUE),         // option "Bootstrap"
     fOobScore(kFALSE),         // option "OoBScore"
     fNjobs(1),                 // option "NJobs"
     fRandomState("None"),      // option "RandomState"
     fVerbose(0),               // option "Verbose"
     fWarmStart(kFALSE),        // option "WarmStart"
     fClassWeight("None")       // option "ClassWeight"
{
}


//_______________________________________________________________________


// Destructor: performs no work of its own.
// NOTE(review): the PyObject* members filled by ProcessOptions() are not
// released here - confirm whether that is intentional.
MethodPyRandomForest::~MethodPyRandomForest() {}


//_______________________________________________________________________


// Reports which analysis types this method accepts:
//  - Types::kClassification with exactly two classes,
//  - Types::kMulticlass with two or more classes.
// Everything else is rejected. The third argument is not used.
Bool_t MethodPyRandomForest::HasAnalysisType(Types::EAnalysisType type, UInt_t numberClasses, UInt_t)
{
   switch (type) {
   case Types::kClassification:
      return (numberClasses == 2) ? kTRUE : kFALSE;
   case Types::kMulticlass:
      return (numberClasses >= 2) ? kTRUE : kFALSE;
   default:
      return kFALSE;
   }
}


//_______________________________________________________________________


void MethodPyRandomForest::DeclareOptions()

{

   MethodBase::DeclareCompatibilityOptions();


   DeclareOptionRef(fNestimators, "NEstimators", "Integer, optional (default=10). The number of trees in the forest.");

   DeclareOptionRef(fCriterion, "Criterion", "String, optional (default='gini') \

      The function to measure the quality of a split. Supported criteria are \

      'gini' for the Gini impurity and 'entropy' for the information gain. \

      Note: this parameter is tree-specific.");


   DeclareOptionRef(fMaxDepth, "MaxDepth", "integer or None, optional (default=None) \

      The maximum depth of the tree. If None, then nodes are expanded until \

      all leaves are pure or until all leaves contain less than \

      min_samples_split samples. \

      Ignored if ``max_leaf_nodes`` is not None.");


   DeclareOptionRef(fMinSamplesSplit, "MinSamplesSplit", "integer, optional (default=2)\

      The minimum number of samples required to split an internal node.");


   DeclareOptionRef(fMinSamplesLeaf, "MinSamplesLeaf", "integer, optional (default=1) \

      The minimum number of samples in newly created leaves.  A split is \

      discarded if after the split, one of the leaves would contain less then \

      ``min_samples_leaf`` samples.");

   DeclareOptionRef(fMinWeightFractionLeaf, "MinWeightFractionLeaf", "//float, optional (default=0.) \

      The minimum weighted fraction of the input samples required to be at a \

      leaf node.");

   DeclareOptionRef(fMaxFeatures, "MaxFeatures", "The number of features to consider when looking for the best split");


   DeclareOptionRef(fMaxLeafNodes, "MaxLeafNodes", "int or None, optional (default=None)\

      Grow trees with ``max_leaf_nodes`` in best-first fashion.\

      Best nodes are defined as relative reduction in impurity.\

      If None then unlimited number of leaf nodes.\

      If not None then ``max_depth`` will be ignored.");


   DeclareOptionRef(fBootstrap, "Bootstrap", "boolean, optional (default=True) \

      Whether bootstrap samples are used when building trees.");


   DeclareOptionRef(fOobScore, "OoBScore", " bool Whether to use out-of-bag samples to estimate\

      the generalization error.");


   DeclareOptionRef(fNjobs, "NJobs", " integer, optional (default=1) \

      The number of jobs to run in parallel for both `fit` and `predict`. \

      If -1, then the number of jobs is set to the number of cores.");


   DeclareOptionRef(fRandomState, "RandomState", "int, RandomState instance or None, optional (default=None)\

      If int, random_state is the seed used by the random number generator;\

      If RandomState instance, random_state is the random number generator;\

      If None, the random number generator is the RandomState instance used\

      by `np.random`.");


   DeclareOptionRef(fVerbose, "Verbose", "int, optional (default=0)\

      Controls the verbosity of the tree building process.");


   DeclareOptionRef(fWarmStart, "WarmStart", "bool, optional (default=False)\

      When set to ``True``, reuse the solution of the previous call to fit\

      and add more estimators to the ensemble, otherwise, just fit a whole\

      new forest.");


   DeclareOptionRef(fClassWeight, "ClassWeight", "dict, list of dicts, \"auto\", \"subsample\" or None, optional\

      Weights associated with classes in the form ``{class_label: weight}``.\

      If not given, all classes are supposed to have weight one. For\

      multi-output problems, a list of dicts can be provided in the same\

      order as the columns of y.\

      The \"auto\" mode uses the values of y to automatically adjust\

      weights inversely proportional to class frequencies in the input data.\

      The \"subsample\" mode is the same as \"auto\" except that weights are\

      computed based on the bootstrap sample for every tree grown.\

      For multi-output, the weights of each column of y will be multiplied.\

      Note that these weights will be multiplied with sample_weight (passed\

      through the fit method) if sample_weight is specified.");


   DeclareOptionRef(fFilenameClassifier, "FilenameClassifier",

      "Store trained classifier in this file");

}


//_______________________________________________________________________

// Check options and load them to local python namespace


// Validates the option members, turns each of them into a Python object with
// Eval() and stores that object in the local Python namespace (fLocalNS)
// under the name that the RandomForestClassifier(...) call in Train() uses.
// Invalid values are reported through the logger (kFATAL, except for
// MinWeightFractionLeaf which is reported as kERROR).
//
// Changes with respect to the previous version:
//  - MaxDepth and MaxFeatures are now null-checked BEFORE they are inserted
//    into the dictionary (a failed Eval() used to be handed to
//    PyDict_SetItemString() as a null value), matching MaxLeafNodes,
//    RandomState and ClassWeight;
//  - NJobs = -1 is accepted, as advertised by the option help text.
//
// NOTE(review): like the rest of this file, the checks assume that a kFATAL
// log does not return normally.
void MethodPyRandomForest::ProcessOptions()
{
   if (fNestimators <= 0) {
      Log() << kFATAL << " NEstimators <=0... that does not work !! " << Endl;
   }
   pNestimators = Eval(Form("%i", fNestimators));
   PyDict_SetItemString(fLocalNS, "nEstimators", pNestimators);

   if (fCriterion != "gini" && fCriterion != "entropy") {
      Log() << kFATAL << Form(" Criterion = %s... that does not work !! ", fCriterion.Data())
            << " The options are `gini` or `entropy`." << Endl;
   }
   // The criterion is wrapped in quotes so that Eval() sees a Python string literal
   pCriterion = Eval(Form("'%s'", fCriterion.Data()));
   PyDict_SetItemString(fLocalNS, "criterion", pCriterion);

   // Free-form Python text: a null result means it could not be evaluated
   pMaxDepth = Eval(fMaxDepth);
   if (!pMaxDepth) {
      Log() << kFATAL << Form(" MaxDepth = %s... that does not work !! ", fMaxDepth.Data())
            << " The options are None or integer." << Endl;
   }
   PyDict_SetItemString(fLocalNS, "maxDepth", pMaxDepth);

   if (fMinSamplesSplit < 0) {
      Log() << kFATAL << " MinSamplesSplit < 0... that does not work !! " << Endl;
   }
   pMinSamplesSplit = Eval(Form("%i", fMinSamplesSplit));
   PyDict_SetItemString(fLocalNS, "minSamplesSplit", pMinSamplesSplit);

   if (fMinSamplesLeaf < 0) {
      Log() << kFATAL << " MinSamplesLeaf < 0... that does not work !! " << Endl;
   }
   pMinSamplesLeaf = Eval(Form("%i", fMinSamplesLeaf));
   PyDict_SetItemString(fLocalNS, "minSamplesLeaf", pMinSamplesLeaf);

   if (fMinWeightFractionLeaf < 0) {
      Log() << kERROR << " MinWeightFractionLeaf < 0... that does not work !! " << Endl;
   }
   pMinWeightFractionLeaf = Eval(Form("%f", fMinWeightFractionLeaf));
   PyDict_SetItemString(fLocalNS, "minWeightFractionLeaf", pMinWeightFractionLeaf);

   if (fMaxFeatures == "auto") fMaxFeatures = "sqrt"; // change in API from v 1.11
   // Bare keywords are quoted so that Eval() yields a Python string
   if (fMaxFeatures == "sqrt" || fMaxFeatures == "log2"){
      fMaxFeatures = Form("'%s'", fMaxFeatures.Data());
   }
   pMaxFeatures = Eval(fMaxFeatures);
   if (!pMaxFeatures) {
      Log() << kFATAL << Form(" MaxFeatures = %s... that does not work !! ", fMaxFeatures.Data())
            << "int, float, string or None, optional (default='auto')"
            << "The number of features to consider when looking for the best split:"
            << "If int, then consider `max_features` features at each split."
            << "If float, then `max_features` is a percentage and"
            << "`int(max_features * n_features)` features are considered at each split."
            << "If 'auto', then `max_features=sqrt(n_features)`."
            << "If 'sqrt', then `max_features=sqrt(n_features)`."
            << "If 'log2', then `max_features=log2(n_features)`."
            << "If None, then `max_features=n_features`." << Endl;
   }
   PyDict_SetItemString(fLocalNS, "maxFeatures", pMaxFeatures);

   pMaxLeafNodes = Eval(fMaxLeafNodes);
   if (!pMaxLeafNodes) {
      Log() << kFATAL << Form(" MaxLeafNodes = %s... that does not work !! ", fMaxLeafNodes.Data())
            << " The options are None or integer." << Endl;
   }
   PyDict_SetItemString(fLocalNS, "maxLeafNodes", pMaxLeafNodes);

   pRandomState = Eval(fRandomState);
   if (!pRandomState) {
      Log() << kFATAL << Form(" RandomState = %s... that does not work !! ", fRandomState.Data())
            << "If int, random_state is the seed used by the random number generator;"
            << "If RandomState instance, random_state is the random number generator;"
            << "If None, the random number generator is the RandomState instance used by `np.random`." << Endl;
   }
   PyDict_SetItemString(fLocalNS, "randomState", pRandomState);

   pClassWeight = Eval(fClassWeight);
   if (!pClassWeight) {
      Log() << kFATAL << Form(" ClassWeight = %s... that does not work !! ", fClassWeight.Data())
            << "dict, list of dicts, 'auto', 'subsample' or None, optional" << Endl;
   }
   PyDict_SetItemString(fLocalNS, "classWeight", pClassWeight);

   // -1 is let through because the NJobs help text documents it as
   // "the number of jobs is set to the number of cores"
   if (fNjobs < 1 && fNjobs != -1) {
      Log() << kFATAL << Form(" NJobs = %i... that does not work !! ", fNjobs)
            << "Value has to be greater than zero, or -1 to use all cores." << Endl;
   }
   pNjobs = Eval(Form("%i", fNjobs));
   PyDict_SetItemString(fLocalNS, "nJobs", pNjobs);

   pBootstrap = (fBootstrap) ? Eval("True") : Eval("False");
   PyDict_SetItemString(fLocalNS, "bootstrap", pBootstrap);

   pOobScore = (fOobScore) ? Eval("True") : Eval("False");
   PyDict_SetItemString(fLocalNS, "oobScore", pOobScore);

   pVerbose = Eval(Form("%i", fVerbose));
   PyDict_SetItemString(fLocalNS, "verbose", pVerbose);

   pWarmStart = (fWarmStart) ? Eval("True") : Eval("False");
   PyDict_SetItemString(fLocalNS, "warmStart", pWarmStart);

   // If no filename is given, set default
   if(fFilenameClassifier.IsNull())
   {
      fFilenameClassifier = GetWeightFileDir() + "/PyRFModel_" + GetName() + ".PyData";
   }
}


//_______________________________________________________________________


void MethodPyRandomForest::Init()

{

   TMVA::Internal::PyGILRAII raii;

   _import_array(); //require to use numpy arrays


   // Check options and load them to local python namespace

   ProcessOptions();


   // Import module for random forest classifier

   PyRunString("import sklearn.ensemble");


   // Get data properties

   fNvars = GetNVariables();

   fNoutputs = DataInfo().GetNClasses();

}


//_______________________________________________________________________


void MethodPyRandomForest::Train()

{

   // Load training data (data, classes, weights) to python arrays

   int fNrowsTraining = Data()->GetNTrainingEvents(); //every row is an event, a class type and a weight

   npy_intp dimsData[2];

   dimsData[0] = fNrowsTraining;

   dimsData[1] = fNvars;

   PyArrayObject * fTrainData = (PyArrayObject *)PyArray_SimpleNew(2, dimsData, NPY_FLOAT);

   PyDict_SetItemString(fLocalNS, "trainData", (PyObject*)fTrainData);

   float *TrainData = (float *)(PyArray_DATA(fTrainData));


   npy_intp dimsClasses = (npy_intp) fNrowsTraining;

   PyArrayObject * fTrainDataClasses = (PyArrayObject *)PyArray_SimpleNew(1, &dimsClasses, NPY_FLOAT);

   PyDict_SetItemString(fLocalNS, "trainDataClasses", (PyObject*)fTrainDataClasses);

   float *TrainDataClasses = (float *)(PyArray_DATA(fTrainDataClasses));


   PyArrayObject * fTrainDataWeights = (PyArrayObject *)PyArray_SimpleNew(1, &dimsClasses, NPY_FLOAT);

   PyDict_SetItemString(fLocalNS, "trainDataWeights", (PyObject*)fTrainDataWeights);

   float *TrainDataWeights = (float *)(PyArray_DATA(fTrainDataWeights));


   for (int i = 0; i < fNrowsTraining; i++) {

      // Fill training data matrix

      const TMVA::Event *e = Data()->GetTrainingEvent(i);

      for (UInt_t j = 0; j < fNvars; j++) {

         TrainData[j + i * fNvars] = e->GetValue(j);

      }


      // Fill target classes

      TrainDataClasses[i] = e->GetClass();


      // Get event weight

      TrainDataWeights[i] = e->GetWeight();

   }


   // Create classifier object

   PyRunString("classifier = sklearn.ensemble.RandomForestClassifier(bootstrap=bootstrap, class_weight=classWeight, criterion=criterion, max_depth=maxDepth, max_features=maxFeatures, max_leaf_nodes=maxLeafNodes, min_samples_leaf=minSamplesLeaf, min_samples_split=minSamplesSplit, min_weight_fraction_leaf=minWeightFractionLeaf, n_estimators=nEstimators, n_jobs=nJobs, oob_score=oobScore, random_state=randomState, verbose=verbose, warm_start=warmStart)",

      "Failed to setup classifier");


   // Fit classifier

   // NOTE: We dump the output to a variable so that the call does not pollute stdout

   PyRunString("dump = classifier.fit(trainData, trainDataClasses, trainDataWeights)", "Failed to train classifier");


   // Store classifier

   fClassifier = PyDict_GetItemString(fLocalNS, "classifier");

   if(fClassifier == 0) {

      Log() << kFATAL << "Can't create classifier object from RandomForestClassifier" << Endl;

      Log() << Endl;

   }


   if (IsModelPersistence()) {

      Log() << Endl;

      Log() << gTools().Color("bold") << "Saving state file: " << gTools().Color("reset") << fFilenameClassifier << Endl;

      Log() << Endl;

      Serialize(fFilenameClassifier, fClassifier);

   }

}


//_______________________________________________________________________


void MethodPyRandomForest::TestClassification()

{

   MethodBase::TestClassification();

}


//_______________________________________________________________________


// Evaluates the classifier for the events [firstEvt, lastEvt) of the current
// data set in one predict_proba() call and returns, per event, the entry of
// the probability row at index Types::kSignal.
//
// firstEvt / lastEvt are sanitised first: an inverted or too large range ends
// at the number of available events, a negative start becomes 0. The third
// argument (progress logging) is ignored.
//
// Changes with respect to the previous version:
//  - the loop now reads event firstEvt + ievt; it used to read event ievt,
//    i.e. always the first events of the data set whatever firstEvt was;
//  - a start beyond the end yields an empty result instead of a negative
//    array dimension;
//  - the numpy allocation and the predict_proba() result are checked before
//    their buffers are accessed;
//  - the loop counters are Long64_t like the event count.
//
// NOTE(review): the result buffer is read as C-contiguous double with
// fNoutputs columns - confirm this matches what predict_proba returns.
std::vector<Double_t> MethodPyRandomForest::GetMvaValues(Long64_t firstEvt, Long64_t lastEvt, Bool_t /* logProgress */)
{
   // Load model if not already done
   if (fClassifier == 0) ReadModelFromFile();

   // Determine number of events
   Long64_t nEvents = Data()->GetNEvents();
   if (firstEvt > lastEvt || lastEvt > nEvents) lastEvt = nEvents;
   if (firstEvt < 0) firstEvt = 0;
   if (firstEvt > lastEvt) firstEvt = lastEvt; // start past the end: nothing to evaluate
   nEvents = lastEvt-firstEvt;

   // Get data
   npy_intp dims[2];
   dims[0] = (npy_intp) nEvents;
   dims[1] = (npy_intp) fNvars;
   PyArrayObject *pEvent= (PyArrayObject *)PyArray_SimpleNew(2, dims, NPY_FLOAT);
   if (pEvent == 0) {
      Log() << kFATAL << "Failed to allocate numpy array for the input events" << Endl;
   }
   float *pValue = (float *)(PyArray_DATA(pEvent));

   for (Long64_t ievt = 0; ievt < nEvents; ievt++) {
      // Row ievt of the matrix holds event firstEvt + ievt of the data set
      Data()->SetCurrentEvent(firstEvt + ievt);
      const TMVA::Event *e = Data()->GetEvent();
      for (UInt_t i = 0; i < fNvars; i++) {
         pValue[ievt * fNvars + i] = e->GetValue(i);
      }
   }

   // Get prediction from classifier
   PyArrayObject *result = (PyArrayObject *)PyObject_CallMethod(fClassifier, const_cast<char *>("predict_proba"), const_cast<char *>("(O)"), pEvent);
   if (result == 0) {
      // The call raised a Python exception: report it instead of dereferencing null
      Py_DECREF(pEvent);
      PyErr_Print();
      Log() << kFATAL << "Failed to get predictions from classifier" << Endl;
   }
   double *proba = (double *)(PyArray_DATA(result));

   // Return signal probabilities
   if(Long64_t(mvaValues.size()) != nEvents) mvaValues.resize(nEvents);
   for (Long64_t i = 0; i < nEvents; ++i) {
      mvaValues[i] = proba[fNoutputs*i + TMVA::Types::kSignal];
   }

   Py_DECREF(pEvent);
   Py_DECREF(result);

   return mvaValues;
}


//_______________________________________________________________________


// Evaluates the classifier for the current event and returns the entry of
// the predict_proba() row at index Types::kSignal. No error estimate is
// available: errLower / errUpper are handed to NoErrorCalc().
//
// Change with respect to the previous version: the numpy allocation and the
// predict_proba() result are checked before their buffers are accessed (a
// Python exception used to end in a null-pointer dereference).
//
// NOTE(review): the result buffer is read as double - confirm this matches
// the dtype predict_proba returns.
Double_t MethodPyRandomForest::GetMvaValue(Double_t *errLower, Double_t *errUpper)
{
   // cannot determine error
   NoErrorCalc(errLower, errUpper);

   // Load model if not already done
   if (fClassifier == 0) ReadModelFromFile();

   // Get current event and load to python array (one row, fNvars columns)
   const TMVA::Event *e = Data()->GetEvent();
   npy_intp dims[2];
   dims[0] = 1;
   dims[1] = (npy_intp) fNvars;
   PyArrayObject *pEvent= (PyArrayObject *)PyArray_SimpleNew(2, dims, NPY_FLOAT);
   if (pEvent == 0) {
      Log() << kFATAL << "Failed to allocate numpy array for the input event" << Endl;
   }
   float *pValue = (float *)(PyArray_DATA(pEvent));
   for (UInt_t i = 0; i < fNvars; i++) pValue[i] = e->GetValue(i);

   // Get prediction from classifier
   PyArrayObject *result = (PyArrayObject *)PyObject_CallMethod(fClassifier, const_cast<char *>("predict_proba"), const_cast<char *>("(O)"), pEvent);
   if (result == 0) {
      // The call raised a Python exception: report it instead of dereferencing null
      Py_DECREF(pEvent);
      PyErr_Print();
      Log() << kFATAL << "Failed to get prediction from classifier" << Endl;
   }
   double *proba = (double *)(PyArray_DATA(result));

   // Return MVA value: the signal probability
   const Double_t mvaValue = proba[TMVA::Types::kSignal];

   Py_DECREF(result);
   Py_DECREF(pEvent);

   return mvaValue;
}


//_______________________________________________________________________


// Evaluates the classifier for the current event and returns the first
// fNoutputs entries of the predict_proba() row, one per class. The returned
// reference points to the member vector classValues, which is overwritten by
// the next call.
//
// Change with respect to the previous version: the numpy allocation and the
// predict_proba() result are checked before their buffers are accessed (a
// Python exception used to end in a null-pointer dereference).
//
// NOTE(review): the result buffer is read as double with at least fNoutputs
// entries - confirm this matches what predict_proba returns.
std::vector<Float_t>& MethodPyRandomForest::GetMulticlassValues()
{
   // Load model if not already done
   if (fClassifier == 0) ReadModelFromFile();

   // Get current event and load to python array (one row, fNvars columns)
   const TMVA::Event *e = Data()->GetEvent();
   npy_intp dims[2];
   dims[0] = 1;
   dims[1] = (npy_intp) fNvars;
   PyArrayObject *pEvent= (PyArrayObject *)PyArray_SimpleNew(2, dims, NPY_FLOAT);
   if (pEvent == 0) {
      Log() << kFATAL << "Failed to allocate numpy array for the input event" << Endl;
   }
   float *pValue = (float *)(PyArray_DATA(pEvent));
   for (UInt_t i = 0; i < fNvars; i++) pValue[i] = e->GetValue(i);

   // Get prediction from classifier
   PyArrayObject *result = (PyArrayObject *)PyObject_CallMethod(fClassifier, const_cast<char *>("predict_proba"), const_cast<char *>("(O)"), pEvent);
   if (result == 0) {
      // The call raised a Python exception: report it instead of dereferencing null
      Py_DECREF(pEvent);
      PyErr_Print();
      Log() << kFATAL << "Failed to get prediction from classifier" << Endl;
   }
   double *proba = (double *)(PyArray_DATA(result));

   // Return MVA values (double probabilities are stored as Float_t)
   if(UInt_t(classValues.size()) != fNoutputs) classValues.resize(fNoutputs);
   for(UInt_t i = 0; i < fNoutputs; i++) classValues[i] = proba[i];

   Py_DECREF(pEvent);
   Py_DECREF(result);

   return classValues;
}


//_______________________________________________________________________


void MethodPyRandomForest::ReadModelFromFile()

{

   if (!PyIsInitialized()) {

      PyInitialize();

   }


   Log() << Endl;

   Log() << gTools().Color("bold") << "Loading state file: " << gTools().Color("reset") << fFilenameClassifier << Endl;

   Log() << Endl;


   // Load classifier from file

   Int_t err = UnSerialize(fFilenameClassifier, &fClassifier);

   if(err != 0)

   {

       Log() << kFATAL << Form("Failed to load classifier from file (error code: %i): %s", err, fFilenameClassifier.Data()) << Endl;

   }


   // Book classifier object in python dict

   PyDict_SetItemString(fLocalNS, "classifier", fClassifier);


   // Load data properties

   // NOTE: This has to be repeated here for the reader application

   fNvars = GetNVariables();

   fNoutputs = DataInfo().GetNClasses();

}


//_______________________________________________________________________


// Builds the variable ranking from the classifier's feature_importances_
// attribute: entry iVar of that array becomes the rank value of input
// variable iVar. The new Ranking is stored in fRanking and returned.
// NOTE(review): the attribute's buffer is read as Double_t with at least
// fNvars entries - confirm against the scikit-learn dtype.
const Ranking* MethodPyRandomForest::CreateRanking()
{
   // Fetch the importances (new reference, released below)
   PyObject *pImportances = PyObject_GetAttrString(fClassifier, "feature_importances_");
   if (pImportances == 0) {
      Log() << kFATAL << "Failed to get ranking from classifier" << Endl;
   }

   // Fill ranking object and return it
   fRanking = new Ranking(GetName(), "Variable Importance");
   const Double_t *importance = (Double_t *)PyArray_DATA((PyArrayObject *)pImportances);
   for (UInt_t iVar = 0; iVar < fNvars; ++iVar) {
      const Rank variableRank(GetInputLabel(iVar), importance[iVar]);
      fRanking->AddRank(variableRank);
   }

   Py_DECREF(pImportances);

   return fRanking;
}


//_______________________________________________________________________


// Writes a short description of the random forest method to the logger,
// followed by an empty line and a pointer to the scikit-learn documentation.
void MethodPyRandomForest::GetHelpMessage() const
{
   // typical length of text line:
   //       "|--------------------------------------------------------------|"
   static const char *const description[] = {
      "A random forest is a meta estimator that fits a number of decision",
      "tree classifiers on various sub-samples of the dataset and use",
      "averaging to improve the predictive accuracy and control over-fitting."
   };
   const unsigned int nLines = sizeof(description) / sizeof(description[0]);

   for (unsigned int iLine = 0; iLine < nLines; ++iLine) {
      Log() << description[iLine] << Endl;
   }
   Log() << Endl;
   Log() << "Check out the scikit-learn documentation for more information." << Endl;
}


ClassifierFactory.h

REGISTER_METHOD
#define REGISTER_METHOD(CLASS)
for example
Definition ClassifierFactory.h:124

Configurable.h

DataSet.h

Event.h

IMethod.h

MethodPyRandomForest.h

MsgLogger.h

PDF.h

PyObject
_object PyObject
Definition PyMethodBase.h:36

e
#define e(i)
Definition RSha256.hxx:103

Ranking.h

Results.h

Bool_t
bool Bool_t
Boolean (0=false, 1=true) (bool).
Definition RtypesCore.h:77

Int_t
int Int_t
Signed integer 4 bytes (int).
Definition RtypesCore.h:59

UInt_t
unsigned int UInt_t
Unsigned integer 4 bytes (unsigned int).
Definition RtypesCore.h:60

kFALSE
constexpr Bool_t kFALSE
Definition RtypesCore.h:108

Double_t
double Double_t
Double 8 bytes.
Definition RtypesCore.h:73

Long64_t
long long Long64_t
Portable signed long integer 8 bytes.
Definition RtypesCore.h:83

kTRUE
constexpr Bool_t kTRUE
Definition RtypesCore.h:107

result
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t result
Definition TGWin32VirtualXProxy.cxx:174

type
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h Atom_t Int_t ULong_t ULong_t unsigned char prop_list Atom_t Atom_t Atom_t Time_t type
Definition TGWin32VirtualXProxy.cxx:249

TMatrix.h

err
Double_t err
Definition TMultiDimFit.cxx:1939

Form
char * Form(const char *fmt,...)
Formats a string in a circular formatting buffer.
Definition TString.cxx:2496

Timer.h

Tools.h

VariableTransformBase.h

Long64_t

TMVA::Configurable::DeclareOptionRef
OptionBase * DeclareOptionRef(T &ref, const TString &name, const TString &desc="")

TMVA::Configurable::Log
MsgLogger & Log() const
Definition Configurable.h:122

TMVA::DataSetInfo
Class that contains all the data information.
Definition DataSetInfo.h:62

TMVA::DataSetInfo::GetNClasses
UInt_t GetNClasses() const
Definition DataSetInfo.h:155

TMVA::DataSet::GetEvent
const Event * GetEvent() const
returns event without transformations
Definition DataSet.cxx:202

TMVA::DataSet::GetNEvents
Long64_t GetNEvents(Types::ETreeType type=Types::kMaxTreeType) const
Definition DataSet.h:206

TMVA::DataSet::GetNTrainingEvents
Long64_t GetNTrainingEvents() const
Definition DataSet.h:68

TMVA::DataSet::SetCurrentEvent
void SetCurrentEvent(Long64_t ievt) const
Definition DataSet.h:88

TMVA::DataSet::GetTrainingEvent
const Event * GetTrainingEvent(Long64_t ievt) const
Definition DataSet.h:74

TMVA::Event
Definition Event.h:51

TMVA::Internal::PyGILRAII
Definition MethodPyAdaBoost.cxx:47

TMVA::Internal::PyGILRAII::m_GILState
PyGILState_STATE m_GILState
Definition MethodPyAdaBoost.cxx:48

TMVA::Internal::PyGILRAII::~PyGILRAII
~PyGILRAII()
Definition MethodPyRandomForest.cxx:51

TMVA::Internal::PyGILRAII::PyGILRAII
PyGILRAII()
Definition MethodPyRandomForest.cxx:50

TMVA::MethodBase::GetName
const char * GetName() const override
Definition MethodBase.h:337

TMVA::MethodBase::DeclareCompatibilityOptions
virtual void DeclareCompatibilityOptions()
options that are used ONLY for the READER to ensure backward compatibility they are hence without any...
Definition MethodBase.cxx:595

TMVA::MethodBase::IsModelPersistence
Bool_t IsModelPersistence() const
Definition MethodBase.h:386

TMVA::MethodBase::GetWeightFileDir
const TString & GetWeightFileDir() const
Definition MethodBase.h:495

TMVA::MethodBase::DataInfo
DataSetInfo & DataInfo() const
Definition MethodBase.h:413

TMVA::MethodBase::TestClassification
virtual void TestClassification()
initialization
Definition MethodBase.cxx:1201

TMVA::MethodBase::GetNVariables
UInt_t GetNVariables() const
Definition MethodBase.h:348

TMVA::MethodBase::NoErrorCalc
void NoErrorCalc(Double_t *const err, Double_t *const errUpper)
Definition MethodBase.cxx:900

TMVA::MethodBase::GetInputLabel
const TString & GetInputLabel(Int_t i) const
Definition MethodBase.h:353

TMVA::MethodBase::fRanking
Ranking * fRanking
Definition MethodBase.h:590

TMVA::MethodBase::Data
DataSet * Data() const
Definition MethodBase.h:412

TMVA::MethodPyRandomForest::pMinWeightFractionLeaf
PyObject * pMinWeightFractionLeaf
Definition MethodPyRandomForest.h:115

TMVA::MethodPyRandomForest::pWarmStart
PyObject * pWarmStart
Definition MethodPyRandomForest.h:166

TMVA::MethodPyRandomForest::HasAnalysisType
Bool_t HasAnalysisType(Types::EAnalysisType type, UInt_t numberClasses, UInt_t numberTargets) override
Definition MethodPyRandomForest.cxx:111

TMVA::MethodPyRandomForest::pVerbose
PyObject * pVerbose
Definition MethodPyRandomForest.h:163

TMVA::MethodPyRandomForest::DeclareOptions
void DeclareOptions() override
Definition MethodPyRandomForest.cxx:119

TMVA::MethodPyRandomForest::Init
void Init() override
Definition MethodPyRandomForest.cxx:303

TMVA::MethodPyRandomForest::fMinSamplesSplit
Int_t fMinSamplesSplit
Definition MethodPyRandomForest.h:105

TMVA::MethodPyRandomForest::MethodPyRandomForest
MethodPyRandomForest(const TString &jobName, const TString &methodTitle, DataSetInfo &theData, const TString &theOption="")
Definition MethodPyRandomForest.cxx:60

TMVA::MethodPyRandomForest::pClassWeight
PyObject * pClassWeight
Definition MethodPyRandomForest.h:172

TMVA::MethodPyRandomForest::pMaxDepth
PyObject * pMaxDepth
Definition MethodPyRandomForest.h:99

TMVA::MethodPyRandomForest::fMinSamplesLeaf
Int_t fMinSamplesLeaf
Definition MethodPyRandomForest.h:109

TMVA::MethodPyRandomForest::fMaxFeatures
TString fMaxFeatures
Definition MethodPyRandomForest.h:122

TMVA::MethodPyRandomForest::fCriterion
TString fCriterion
Definition MethodPyRandomForest.h:94

TMVA::MethodPyRandomForest::pNjobs
PyObject * pNjobs
Definition MethodPyRandomForest.h:151

TMVA::MethodPyRandomForest::fBootstrap
Bool_t fBootstrap
Definition MethodPyRandomForest.h:144

TMVA::MethodPyRandomForest::pNestimators
PyObject * pNestimators
Definition MethodPyRandomForest.h:89

TMVA::MethodPyRandomForest::pBootstrap
PyObject * pBootstrap
Definition MethodPyRandomForest.h:143

TMVA::MethodPyRandomForest::pRandomState
PyObject * pRandomState
Definition MethodPyRandomForest.h:156

TMVA::MethodPyRandomForest::GetMvaValues
std::vector< Double_t > GetMvaValues(Long64_t firstEvt=0, Long64_t lastEvt=-1, Bool_t logProgress=false) override
get all the MVA values for the events of the current Data type
Definition MethodPyRandomForest.cxx:384

TMVA::MethodPyRandomForest::GetMulticlassValues
std::vector< Float_t > & GetMulticlassValues() override
Definition MethodPyRandomForest.cxx:461

TMVA::MethodPyRandomForest::fOobScore
Bool_t fOobScore
Definition MethodPyRandomForest.h:148

TMVA::MethodPyRandomForest::fNoutputs
UInt_t fNoutputs
Definition MethodPyRandomForest.h:84

TMVA::MethodPyRandomForest::pOobScore
PyObject * pOobScore
Definition MethodPyRandomForest.h:147

TMVA::MethodPyRandomForest::~MethodPyRandomForest
~MethodPyRandomForest(void)
Definition MethodPyRandomForest.cxx:106

TMVA::MethodPyRandomForest::pMaxLeafNodes
PyObject * pMaxLeafNodes
Definition MethodPyRandomForest.h:136

TMVA::MethodPyRandomForest::fVerbose
Int_t fVerbose
Definition MethodPyRandomForest.h:164

TMVA::MethodPyRandomForest::fClassWeight
TString fClassWeight
Definition MethodPyRandomForest.h:173

TMVA::MethodPyRandomForest::fMaxLeafNodes
TString fMaxLeafNodes
Definition MethodPyRandomForest.h:137

TMVA::MethodPyRandomForest::classValues
std::vector< Float_t > classValues
Definition MethodPyRandomForest.h:81

TMVA::MethodPyRandomForest::fNestimators
Int_t fNestimators
Definition MethodPyRandomForest.h:90

TMVA::MethodPyRandomForest::pMinSamplesLeaf
PyObject * pMinSamplesLeaf
Definition MethodPyRandomForest.h:108

TMVA::MethodPyRandomForest::Train
void Train() override
Definition MethodPyRandomForest.cxx:320

TMVA::MethodPyRandomForest::fFilenameClassifier
TString fFilenameClassifier
Definition MethodPyRandomForest.h:85

TMVA::MethodPyRandomForest::fRandomState
TString fRandomState
Definition MethodPyRandomForest.h:157

TMVA::MethodPyRandomForest::pCriterion
PyObject * pCriterion
Definition MethodPyRandomForest.h:93

TMVA::MethodPyRandomForest::mvaValues
std::vector< Double_t > mvaValues
Definition MethodPyRandomForest.h:80

TMVA::MethodPyRandomForest::GetHelpMessage
void GetHelpMessage() const override
Definition MethodPyRandomForest.cxx:537

TMVA::MethodPyRandomForest::pMaxFeatures
PyObject * pMaxFeatures
Definition MethodPyRandomForest.h:121

TMVA::MethodPyRandomForest::TestClassification
void TestClassification() override
initialization
Definition MethodPyRandomForest.cxx:378

TMVA::MethodPyRandomForest::fNjobs
Int_t fNjobs
Definition MethodPyRandomForest.h:152

TMVA::MethodPyRandomForest::fWarmStart
Bool_t fWarmStart
Definition MethodPyRandomForest.h:167

TMVA::MethodPyRandomForest::CreateRanking
const Ranking * CreateRanking() override
Definition MethodPyRandomForest.cxx:517

TMVA::MethodPyRandomForest::fMinWeightFractionLeaf
Double_t fMinWeightFractionLeaf
Definition MethodPyRandomForest.h:116

TMVA::MethodPyRandomForest::fMaxDepth
TString fMaxDepth
Definition MethodPyRandomForest.h:100

TMVA::MethodPyRandomForest::GetMvaValue
Double_t GetMvaValue(Double_t *errLower=nullptr, Double_t *errUpper=nullptr) override
Definition MethodPyRandomForest.cxx:429

TMVA::MethodPyRandomForest::ReadModelFromFile
void ReadModelFromFile() override
Definition MethodPyRandomForest.cxx:490

TMVA::MethodPyRandomForest::ProcessOptions
void ProcessOptions() override
Definition MethodPyRandomForest.cxx:196

TMVA::MethodPyRandomForest::pMinSamplesSplit
PyObject * pMinSamplesSplit
Definition MethodPyRandomForest.h:104

TMVA::MethodPyRandomForest::fNvars
UInt_t fNvars
Definition MethodPyRandomForest.h:83

TMVA::PyMethodBase::PyIsInitialized
static int PyIsInitialized()
Check Python interpreter initialization status.
Definition PyMethodBase.cxx:252

TMVA::PyMethodBase::Eval
PyObject * Eval(TString code)
Evaluate Python code.
Definition PyMethodBase.cxx:135

TMVA::PyMethodBase::PyInitialize
static void PyInitialize()
Initialize Python interpreter.
Definition PyMethodBase.cxx:152

TMVA::PyMethodBase::Serialize
static void Serialize(TString file, PyObject *classifier)
Serialize Python object.
Definition PyMethodBase.cxx:271

TMVA::PyMethodBase::UnSerialize
static Int_t UnSerialize(TString file, PyObject **obj)
Unserialize Python object.
Definition PyMethodBase.cxx:293

TMVA::PyMethodBase::fClassifier
PyObject * fClassifier
Definition PyMethodBase.h:108

TMVA::PyMethodBase::PyMethodBase
PyMethodBase(const TString &jobName, Types::EMVA methodType, const TString &methodTitle, DataSetInfo &dsi, const TString &theOption="")
Definition PyMethodBase.cxx:83

TMVA::PyMethodBase::PyRunString
void PyRunString(TString code, TString errorMessage="Failed to run python code", int start=256)
Execute Python code from string.
Definition PyMethodBase.cxx:324

TMVA::PyMethodBase::fLocalNS
PyObject * fLocalNS
Definition PyMethodBase.h:127

TMVA::Rank
Definition Ranking.h:76

TMVA::Ranking
Ranking for variables in method (implementation).
Definition Ranking.h:48

TMVA::Tools::Color
const TString & Color(const TString &)
human readable color strings
Definition Tools.cxx:803

TMVA::Types
Singleton class for Global types used by TMVA.
Definition Types.h:71

TMVA::Types::kSignal
@ kSignal
Never change this number - it is elsewhere assumed to be zero !
Definition Types.h:135

TMVA::Types::EAnalysisType
EAnalysisType
Definition Types.h:126

TMVA::Types::kMulticlass
@ kMulticlass
Definition Types.h:129

TMVA::Types::kClassification
@ kClassification
Definition Types.h:127

TString
Basic string class.
Definition TString.h:138

TMVA::Internal
Definition MethodPyAdaBoost.cxx:46

TMVA
create variable transformations
Definition GeneticMinimizer.h:22

TMVA::gTools
Tools & gTools()

TMVA::Endl
MsgLogger & Endl(MsgLogger &ml)
Definition MsgLogger.h:148

Config.h

Types.h