ROOT  6.07/01
Reference Guide
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Properties Friends Macros Groups Pages
MethodPyRandomForest.cxx
Go to the documentation of this file.
1 // @(#)root/tmva/pymva $Id$
2 // Authors: Omar Zapata, Lorenzo Moneta, Sergei Gleyzer 2015
3 
4 /**********************************************************************************
5  * Project: TMVA - a Root-integrated toolkit for multivariate data analysis *
6  * Package: TMVA *
7  * Class : MethodPyRandomForest *
8  * Web : http://oproject.org *
9  * *
10  * Description: *
 11  * Random Forest Classifier from scikit-learn *
12  * *
13  * *
14  * Redistribution and use in source and binary forms, with or without *
15  * modification, are permitted according to the terms listed in LICENSE *
16  * (http://tmva.sourceforge.net/LICENSE) *
17  * *
18  **********************************************************************************/
19 #pragma GCC diagnostic ignored "-Wunused-parameter"
20 #include <iomanip>
21 #include <fstream>
22 
23 #include <Python.h>
24 #define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION
25 #include <numpy/arrayobject.h>
26 
27 #include "TMath.h"
28 #include "Riostream.h"
29 #include "TMatrix.h"
30 #include "TMatrixD.h"
31 #include "TVectorD.h"
32 
35 #include "TMVA/Tools.h"
36 #include "TMVA/Ranking.h"
37 #include "TMVA/Types.h"
38 #include "TMVA/Config.h"
39 #include "TMVA/PDF.h"
40 #include "TMVA/ClassifierFactory.h"
41 
42 #include "TMVA/Results.h"
43 
44 
45 
46 using namespace TMVA;
47 
48 REGISTER_METHOD(PyRandomForest)
49 
 51 
 52 //_______________________________________________________________________
// Standard constructor: forwards job name, method title, dataset info and the
// option string to PyMethodBase, and initializes every hyperparameter to the
// scikit-learn RandomForestClassifier default (n_estimators=10,
// criterion='gini', max_depth=None, ...).  String-typed options hold Python
// expressions evaluated later (note max_features is pre-quoted "'auto'").
// NOTE(review): the opening signature line (doxygen line 53, presumably
// "MethodPyRandomForest::MethodPyRandomForest(const TString &jobName,") was
// lost in this extraction -- confirm against the original source.
 54  const TString &methodTitle,
 55  DataSetInfo &dsi,
 56  const TString &theOption,
 57  TDirectory *theTargetDir) :
 58  PyMethodBase(jobName, Types::kPyRandomForest, methodTitle, dsi, theOption, theTargetDir),
 59  n_estimators(10),
 60  criterion("gini"),
 61  max_depth("None"),
 62  min_samples_split(2),
 63  min_samples_leaf(1),
 64  min_weight_fraction_leaf(0),
 65  max_features("'auto'"),
 66  max_leaf_nodes("None"),
 67  bootstrap(kTRUE),
 68  oob_score(kFALSE),
 69  n_jobs(1),
 70  random_state("None"),
 71  verbose(0),
 72  warm_start(kFALSE),
 73  class_weight("None")
 74 {
 75  // standard constructor for the PyRandomForest
 // Weight files go to the directory configured in TMVA's global I/O settings.
 76  SetWeightFileDir(gConfig().GetIONames().fWeightFileDir);
 77 
 78 }
79 
 80 //_______________________________________________________________________
// Constructor used when the method is instantiated from an existing weight
// file (no job name / option string).  Hyperparameter defaults are identical
// to the standard constructor above.
 81 MethodPyRandomForest::MethodPyRandomForest(DataSetInfo &theData, const TString &theWeightFile, TDirectory *theTargetDir)
 82  : PyMethodBase(Types::kPyRandomForest, theData, theWeightFile, theTargetDir),
 83  n_estimators(10),
 84  criterion("gini"),
 85  max_depth("None"),
 86  min_samples_split(2),
 87  min_samples_leaf(1),
 88  min_weight_fraction_leaf(0),
 89  max_features("'auto'"),
 90  max_leaf_nodes("None"),
 91  bootstrap(kTRUE),
 92  oob_score(kFALSE),
 93  n_jobs(1),
 94  random_state("None"),
 95  verbose(0),
 96  warm_start(kFALSE),
 97  class_weight("None")
 98 {
 // Weight files go to the directory configured in TMVA's global I/O settings.
 99  SetWeightFileDir(gConfig().GetIONames().fWeightFileDir);
 100 }
101 
102 
 103 //_______________________________________________________________________
// Destructor (empty body).
// NOTE(review): the signature line (doxygen line 104, presumably
// "MethodPyRandomForest::~MethodPyRandomForest(void)") was lost in this
// extraction -- confirm against the original source.
 105 {
 106 }
107 
 108 //_______________________________________________________________________
// Tell the TMVA factory which analysis types this method supports: only
// two-class (binary) classification; everything else is rejected.
// NOTE(review): the signature line (doxygen line 109, the
// "Bool_t MethodPyRandomForest::HasAnalysisType(...)" declaration) was lost
// in this extraction -- confirm against the original source.
 110 {
 111  if (type == Types::kClassification && numberClasses == 2) return kTRUE;
 112  return kFALSE;
 113 }
114 
115 
 116 //_______________________________________________________________________
// Declare all user-configurable options.  Each option maps one-to-one onto a
// constructor argument of sklearn.ensemble.RandomForestClassifier; the help
// strings are lifted from the scikit-learn documentation.  The actual
// validation of the values happens later in ProcessOptions().
// NOTE(review): the signature line (doxygen line 117, presumably
// "void MethodPyRandomForest::DeclareOptions()") was lost in this
// extraction -- confirm against the original source.
 118 {
 120 
 121  DeclareOptionRef(n_estimators, "NEstimators", "Integer, optional (default=10). The number of trees in the forest.");
 122  DeclareOptionRef(criterion, "Criterion", "//string, optional (default='gini') \
 123  The function to measure the quality of a split. Supported criteria are \
 124  'gini' for the Gini impurity and 'entropy' for the information gain. \
 125  Note: this parameter is tree-specific.");
 126 
 127  DeclareOptionRef(max_depth, "MaxDepth", "integer or None, optional (default=None) \
 128  The maximum depth of the tree. If None, then nodes are expanded until \
 129  all leaves are pure or until all leaves contain less than \
 130  min_samples_split samples. \
 131  Ignored if ``max_leaf_nodes`` is not None.");
 132  DeclareOptionRef(min_samples_split, "MinSamplesSplit", "integer, optional (default=2)\
 133  The minimum number of samples required to split an internal node.");
 134 
 135  DeclareOptionRef(min_samples_leaf, "MinSamplesLeaf", "integer, optional (default=1) \
 136  The minimum number of samples in newly created leaves. A split is \
 137  discarded if after the split, one of the leaves would contain less then \
 138  ``min_samples_leaf`` samples.");
 139  DeclareOptionRef(min_weight_fraction_leaf, "MinWeightFractionLeaf", "//float, optional (default=0.) \
 140  The minimum weighted fraction of the input samples required to be at a \
 141  leaf node.");
 142  DeclareOptionRef(max_features, "MaxFeatures", "The number of features to consider when looking for the best split");
 143  DeclareOptionRef(max_leaf_nodes, "MaxLeafNodes", "int or None, optional (default=None)\
 144  Grow trees with ``max_leaf_nodes`` in best-first fashion.\
 145  Best nodes are defined as relative reduction in impurity.\
 146  If None then unlimited number of leaf nodes.\
 147  If not None then ``max_depth`` will be ignored.");
 148  DeclareOptionRef(bootstrap, "Bootstrap", "boolean, optional (default=True) \
 149  Whether bootstrap samples are used when building trees.");
 150  DeclareOptionRef(oob_score, "OoBScore", " bool Whether to use out-of-bag samples to estimate\
 151  the generalization error.");
 152  DeclareOptionRef(n_jobs, "NJobs", " integer, optional (default=1) \
 153  The number of jobs to run in parallel for both `fit` and `predict`. \
 154  If -1, then the number of jobs is set to the number of cores.");
 155 
 156  DeclareOptionRef(random_state, "RandomState", "int, RandomState instance or None, optional (default=None)\
 157  If int, random_state is the seed used by the random number generator;\
 158  If RandomState instance, random_state is the random number generator;\
 159  If None, the random number generator is the RandomState instance used\
 160  by `np.random`.");
 161  DeclareOptionRef(verbose, "Verbose", "int, optional (default=0)\
 162  Controls the verbosity of the tree building process.");
 163  DeclareOptionRef(warm_start, "WarmStart", "bool, optional (default=False)\
 164  When set to ``True``, reuse the solution of the previous call to fit\
 165  and add more estimators to the ensemble, otherwise, just fit a whole\
 166  new forest.");
 167  DeclareOptionRef(class_weight, "ClassWeight", "dict, list of dicts, \"auto\", \"subsample\" or None, optional\
 168  Weights associated with classes in the form ``{class_label: weight}``.\
 169  If not given, all classes are supposed to have weight one. For\
 170  multi-output problems, a list of dicts can be provided in the same\
 171  order as the columns of y.\
 172  The \"auto\" mode uses the values of y to automatically adjust\
 173  weights inversely proportional to class frequencies in the input data.\
 174  The \"subsample\" mode is the same as \"auto\" except that weights are\
 175  computed based on the bootstrap sample for every tree grown.\
 176  For multi-output, the weights of each column of y will be multiplied.\
 177  Note that these weights will be multiplied with sample_weight (passed\
 178  through the fit method) if sample_weight is specified.");
 179 }
180 
181 //_______________________________________________________________________
183 {
184  if (n_estimators <= 0) {
185  Log() << kERROR << " NEstimators <=0... that does not work !! "
186  << " I set it to 10 .. just so that the program does not crash"
187  << Endl;
188  n_estimators = 10;
189  }
190  if (criterion != "gini" && criterion != "entropy") {
191  Log() << kFATAL << Form(" Criterion = %s... that does not work !! ", criterion.Data())
192  << " The options are gini of entropy."
193  << Endl;
194  }
195  PyObject *pomax_depth = Eval(max_depth);
196  if (!pomax_depth) {
197  Log() << kFATAL << Form(" MaxDepth = %s... that does not work !! ", criterion.Data())
198  << " The options are None or integer."
199  << Endl;
200  }
201  Py_DECREF(pomax_depth);
202 
203  if (min_samples_split < 0) {
204  Log() << kERROR << " MinSamplesSplit < 0... that does not work !! "
205  << " I set it to 2 .. just so that the program does not crash"
206  << Endl;
207  min_samples_split = 2;
208  }
209  if (min_samples_leaf < 0) {
210  Log() << kERROR << " MinSamplesLeaf < 0... that does not work !! "
211  << " I set it to 1 .. just so that the program does not crash"
212  << Endl;
213  min_samples_leaf = 1;
214  }
215 
216  if (min_weight_fraction_leaf < 0) {
217  Log() << kERROR << " MinWeightFractionLeaf < 0... that does not work !! "
218  << " I set it to 0 .. just so that the program does not crash"
219  << Endl;
221  }
222  if (max_features == "auto" || max_features == "sqrt" || max_features == "log2")max_features = Form("'%s'", max_features.Data());
223  PyObject *pomax_features = Eval(max_features);
224  if (!pomax_features) {
225  Log() << kFATAL << Form(" MaxFeatures = %s... that does not work !! ", max_features.Data())
226  << "int, float, string or None, optional (default='auto')"
227  << "The number of features to consider when looking for the best split:"
228  << "If int, then consider `max_features` features at each split."
229  << "If float, then `max_features` is a percentage and"
230  << "`int(max_features * n_features)` features are considered at each split."
231  << "If 'auto', then `max_features=sqrt(n_features)`."
232  << "If 'sqrt', then `max_features=sqrt(n_features)`."
233  << "If 'log2', then `max_features=log2(n_features)`."
234  << "If None, then `max_features=n_features`."
235  << Endl;
236  }
237  Py_DECREF(pomax_features);
238 
239  PyObject *pomax_leaf_nodes = Eval(max_leaf_nodes);
240  if (!pomax_leaf_nodes) {
241  Log() << kFATAL << Form(" MaxLeafNodes = %s... that does not work !! ", max_leaf_nodes.Data())
242  << " The options are None or integer."
243  << Endl;
244  }
245  Py_DECREF(pomax_leaf_nodes);
246 
247 // bootstrap(kTRUE),
248 // oob_score(kFALSE),
249 // n_jobs(1),
250 
251  PyObject *porandom_state = Eval(random_state);
252  if (!porandom_state) {
253  Log() << kFATAL << Form(" RandomState = %s... that does not work !! ", random_state.Data())
254  << "If int, random_state is the seed used by the random number generator;"
255  << "If RandomState instance, random_state is the random number generator;"
256  << "If None, the random number generator is the RandomState instance used by `np.random`."
257  << Endl;
258  }
259  Py_DECREF(porandom_state);
260 
261 // verbose(0),
262 // warm_start(kFALSE),
263 // class_weight("None")
264  PyObject *poclass_weight = Eval(class_weight);
265  if (!poclass_weight) {
266  Log() << kFATAL << Form(" ClassWeight = %s... that does not work !! ", class_weight.Data())
267  << "dict, list of dicts, 'auto', 'subsample' or None, optional"
268  << Endl;
269  }
270  Py_DECREF(poclass_weight);
271 
272 }
273 
274 //_______________________________________________________________________
276 {
277  ProcessOptions();
278  _import_array();//require to use numpy arrays
279 
280  //Import sklearn
281  // Convert the file name to a Python string.
282  PyObject *pName = PyString_FromString("sklearn.ensemble");
283  // Import the file as a Python module.
284  fModule = PyImport_Import(pName);
285  Py_DECREF(pName);
286 
287  if (!fModule) {
288  Log() << kFATAL << "Can't import sklearn.ensemble" << Endl;
289  Log() << Endl;
290  }
291 
292 
293  //Training data
294  UInt_t fNvars = Data()->GetNVariables();
295  int fNrowsTraining = Data()->GetNTrainingEvents(); //every row is an event, a class type and a weight
296  int *dims = new int[2];
297  dims[0] = fNrowsTraining;
298  dims[1] = fNvars;
299  fTrainData = (PyArrayObject *)PyArray_FromDims(2, dims, NPY_FLOAT);
300  float *TrainData = (float *)(PyArray_DATA(fTrainData));
301 
302 
303  fTrainDataClasses = (PyArrayObject *)PyArray_FromDims(1, &fNrowsTraining, NPY_FLOAT);
304  float *TrainDataClasses = (float *)(PyArray_DATA(fTrainDataClasses));
305 
306  fTrainDataWeights = (PyArrayObject *)PyArray_FromDims(1, &fNrowsTraining, NPY_FLOAT);
307  float *TrainDataWeights = (float *)(PyArray_DATA(fTrainDataWeights));
308 
309  for (int i = 0; i < fNrowsTraining; i++) {
310  const TMVA::Event *e = Data()->GetTrainingEvent(i);
311  for (UInt_t j = 0; j < fNvars; j++) {
312  TrainData[j + i * fNvars] = e->GetValue(j);
313  }
314  if (e->GetClass() == TMVA::Types::kSignal) TrainDataClasses[i] = TMVA::Types::kSignal;
315  else TrainDataClasses[i] = TMVA::Types::kBackground;
316 
317  TrainDataWeights[i] = e->GetWeight();
318  }
319 }
320 
 321 //_______________________________________________________________________
// Build the Py_BuildValue argument tuple from the validated options,
// instantiate sklearn.ensemble.RandomForestClassifier, call fit() on the
// numpy arrays prepared in Init(), and pickle the fitted model to
// <weight dir>/PyRFModel.PyData via fPickleDumps.
// NOTE(review): the signature line (doxygen line 322, presumably
// "void MethodPyRandomForest::Train()") was lost in this extraction.
// NOTE(review): `args` is only Py_DECREF'd in the success branch, and the
// fit() return value overwrites fClassifier without releasing the previous
// reference; `model_data` is not NULL-checked before PyString_AsString.
// The PyObject_Print calls below look like leftover debug output.
 323 {
 324 // n_estimators(10),
 325 // criterion("gini"),
 326 // max_depth("None"),
 327 // min_samples_split(2),
 328 // min_samples_leaf(1),
 329 // min_weight_fraction_leaf(0.0),
 330 // max_features("'auto'"),
 331 // max_leaf_nodes("None"),
 332 // bootstrap(kTRUE),
 333 // oob_score(kFALSE),
 334 // n_jobs(1),
 335 // random_state("None"),
 336 // verbose(0),
 337 // warm_start(kFALSE),
 338 // class_weight("None")
 339 
 340  //NOTE: max_features must have 3 defferents variables int, float and string
 341  if (max_features == "auto" || max_features == "sqrt" || max_features == "log2")max_features = Form("'%s'", max_features.Data());
 342  PyObject *pomax_features = Eval(max_features);
 343  PyObject *pomax_depth = Eval(max_depth);
 344  PyObject *pomax_leaf_nodes = Eval(max_leaf_nodes);
 345  PyObject *porandom_state = Eval(random_state);
 346  PyObject *poclass_weight = Eval(class_weight);
 347 // PyObject_Print(pomax_features,stdout,0);
 348 // std::cout<<std::endl;
 349 //
 350 // PyObject_Print(pomax_depth,stdout,0);
 351 // std::cout<<std::endl;
 // Positional constructor arguments for RandomForestClassifier, in the order
 // declared by the format string "(isOiifOOiiiOiiO)".
 352  PyObject *args = Py_BuildValue("(isOiifOOiiiOiiO)", n_estimators, criterion.Data(), pomax_depth, min_samples_split, \
 353  min_samples_leaf, min_weight_fraction_leaf, pomax_features, pomax_leaf_nodes, \
 354  bootstrap, oob_score, n_jobs, porandom_state, verbose, warm_start, poclass_weight);
 355  Py_DECREF(pomax_depth);
 356  PyObject_Print(args, stdout, 0);
 357  std::cout << std::endl;
 358 
 // Look up the RandomForestClassifier class object in the imported module.
 359  PyObject *pDict = PyModule_GetDict(fModule);
 360  PyObject *fClassifierClass = PyDict_GetItemString(pDict, "RandomForestClassifier");
 361  // Log() << kFATAL <<"Train =" <<n_jobs<<Endl;
 362 
 363  // Create an instance of the class
 364  if (PyCallable_Check(fClassifierClass)) {
 365  //instance
 366  fClassifier = PyObject_CallObject(fClassifierClass , args);
 367  PyObject_Print(fClassifier, stdout, 0);
 368 
 369  Py_DECREF(args);
 370  } else {
 371  PyErr_Print();
 372  Py_DECREF(pDict);
 373  Py_DECREF(fClassifierClass);
 374  Log() << kFATAL << "Can't call function RandomForestClassifier" << Endl;
 375  Log() << Endl;
 376 
 377  }
 378 
 // fit() is called with (X, y, sample_weight); its return value (the fitted
 // estimator) replaces fClassifier.
 379  fClassifier = PyObject_CallMethod(fClassifier, const_cast<char *>("fit"), const_cast<char *>("(OOO)"), fTrainData, fTrainDataClasses, fTrainDataWeights);
 380  // PyObject_Print(fClassifier, stdout, 0);
 381  // pValue =PyObject_CallObject(fClassifier, PyString_FromString("classes_"));
 382  // PyObject_Print(pValue, stdout, 0);
 383 
 // Persist the trained model: pickle it and write the bytes to the weight dir.
 384  TString path = GetWeightFileDir() + "/PyRFModel.PyData";
 385  Log() << Endl;
 386  Log() << gTools().Color("bold") << "--- Saving State File In:" << gTools().Color("reset") << path << Endl;
 387  Log() << Endl;
 388 
 389  PyObject *model_arg = Py_BuildValue("(O)", fClassifier);
 390  PyObject *model_data = PyObject_CallObject(fPickleDumps , model_arg);
 391  std::ofstream PyData;
 392  PyData.open(path.Data());
 393  PyData << PyString_AsString(model_data);
 394  PyData.close();
 395  Py_DECREF(model_arg);
 396  Py_DECREF(model_data);
 397 }
398 
 399 //_______________________________________________________________________
// NOTE(review): both the signature line (doxygen line 400, presumably
// "void MethodPyRandomForest::TestClassification()") and the single body
// line (doxygen line 402, presumably "MethodBase::TestClassification();")
// were lost in this extraction -- confirm against the original source.
 401 {
 403 }
404 
405 
 406 //_______________________________________________________________________
// Return the MVA response for the current event: the signal-class
// probability (column 1) of the classifier's predict_proba() output.
// No error estimate is available (errLower/errUpper are cleared).
// NOTE(review): the signature line (doxygen line 407, presumably
// "Double_t MethodPyRandomForest::GetMvaValue(Double_t *errLower, Double_t *errUpper)")
// was lost in this extraction -- confirm against the original source.
 408 {
 409  // cannot determine error
 410  NoErrorCalc(errLower, errUpper);
 411 
 413 
 414  Double_t mvaValue;
 415  const TMVA::Event *e = Data()->GetEvent();
 416  UInt_t nvars = e->GetNVariables();
 // Pack the event's input variables into a Python tuple for predict_proba.
 417  PyObject *pEvent = PyTuple_New(nvars);
 418  for (UInt_t i = 0; i < nvars; i++) {
 419 
 420  PyObject *pValue = PyFloat_FromDouble(e->GetValue(i));
 421  if (!pValue) {
 422  Py_DECREF(pEvent);
 // NOTE(review): decref'ing fTrainData here looks unintended -- it releases
 // a reference to the training array, not anything allocated in this
 // function.  kFATAL aborts immediately after, so it is moot in practice.
 423  Py_DECREF(fTrainData);
 424  Log() << kFATAL << "Error Evaluating MVA " << Endl;
 425  }
 426  PyTuple_SetItem(pEvent, i, pValue);
 427  }
 // NOTE(review): `result` is not NULL-checked before PyArray_DATA; a failed
 // predict_proba call would crash here.
 428  PyArrayObject *result = (PyArrayObject *)PyObject_CallMethod(fClassifier, const_cast<char *>("predict_proba"), const_cast<char *>("(O)"), pEvent);
 429  double *proba = (double *)(PyArray_DATA(result));
 430  mvaValue = proba[1]; //getting signal prob
 431  Py_DECREF(result);
 432  Py_DECREF(pEvent);
 433  return mvaValue;
 434 }
435 
 436 //_______________________________________________________________________
// Restore a trained classifier: slurp the pickled model written by Train()
// from <weight dir>/PyRFModel.PyData and unpickle it into fClassifier via
// fPickleLoads.  Initializes the Python interpreter on demand.
// NOTE(review): the signature line (doxygen line 437) was lost in this
// extraction -- confirm the method name against the original source.
 438 {
 439  if (!PyIsInitialized()) {
 440  PyInitialize();
 441  }
 442 
 443  TString path = GetWeightFileDir() + "/PyRFModel.PyData";
 444  Log() << Endl;
 445  Log() << gTools().Color("bold") << "--- Loading State File From:" << gTools().Color("reset") << path << Endl;
 446  Log() << Endl;
 447  std::ifstream PyData;
 448  std::stringstream PyDataStream;
 449  std::string PyDataString;
 450 
 // Read the whole pickle file into one string.
 451  PyData.open(path.Data());
 452  PyDataStream << PyData.rdbuf();
 453  PyDataString = PyDataStream.str();
 454  PyData.close();
 455 
 456 // std::cout<<"-----------------------------------\n";
 457 // std::cout<<PyDataString.c_str();
 458 // std::cout<<"-----------------------------------\n";
 // Unpickle: pickle.loads(bytes) -> fitted classifier instance.
 459  PyObject *model_arg = Py_BuildValue("(s)", PyDataString.c_str());
 460  fClassifier = PyObject_CallObject(fPickleLoads , model_arg);
 461 
 462 
 463  Py_DECREF(model_arg);
 464 }
465 
 466 //_______________________________________________________________________
// Print the standard TMVA help text for this method to the logger.
// NOTE(review): the signature line (doxygen line 467, presumably
// "void MethodPyRandomForest::GetHelpMessage() const") was lost in this
// extraction -- confirm against the original source.
 468 {
 469  // get help message text
 470  //
 471  // typical length of text line:
 472  // "|--------------------------------------------------------------|"
 473  Log() << Endl;
 474  Log() << gTools().Color("bold") << "--- Short description:" << gTools().Color("reset") << Endl;
 475  Log() << Endl;
 476  Log() << "Decision Trees and Rule-Based Models " << Endl;
 477  Log() << Endl;
 478  Log() << gTools().Color("bold") << "--- Performance optimisation:" << gTools().Color("reset") << Endl;
 479  Log() << Endl;
 480  Log() << Endl;
 481  Log() << gTools().Color("bold") << "--- Performance tuning via configuration options:" << gTools().Color("reset") << Endl;
 482  Log() << Endl;
 483  Log() << "<None>" << Endl;
 484 }
485 
Bool_t HasAnalysisType(Types::EAnalysisType type, UInt_t numberClasses, UInt_t numberTargets)
const TString & GetWeightFileDir() const
Definition: MethodBase.h:407
MsgLogger & Endl(MsgLogger &ml)
Definition: MsgLogger.h:162
PyObject * fClassifier
Definition: PyMethodBase.h:112
const Event * GetTrainingEvent(Long64_t ievt) const
Definition: DataSet.h:96
Config & gConfig()
OptionBase * DeclareOptionRef(T &ref, const TString &name, const TString &desc="")
DataSet * Data() const
Definition: MethodBase.h:363
EAnalysisType
Definition: Types.h:124
Basic string class.
Definition: TString.h:137
bool Bool_t
Definition: RtypesCore.h:59
const Bool_t kFALSE
Definition: Rtypes.h:92
Double_t GetWeight() const
return the event weight - depending on whether the flag IgnoreNegWeightsInTraining is or not...
Definition: Event.cxx:376
PyArrayObject * fTrainDataClasses
Definition: PyMethodBase.h:116
static int PyIsInitialized()
static void PyInitialize()
const char * Data() const
Definition: TString.h:349
Tools & gTools()
Definition: Tools.cxx:79
static PyObject * Eval(TString code)
PyArrayObject * fTrainDataWeights
Definition: PyMethodBase.h:115
Double_t GetMvaValue(Double_t *errLower=0, Double_t *errUpper=0)
UInt_t GetNVariables() const
accessor to the number of variables
Definition: Event.cxx:303
#define None
Definition: TGWin32.h:68
PyObject * fModule
Definition: PyMethodBase.h:111
unsigned int UInt_t
Definition: RtypesCore.h:42
bool verbose
char * Form(const char *fmt,...)
PyArrayObject * fTrainData
Definition: PyMethodBase.h:114
const Event * GetEvent() const
Definition: DataSet.cxx:186
double Double_t
Definition: RtypesCore.h:55
Describe directory structure in memory.
Definition: TDirectory.h:44
int type
Definition: TGX11.cxx:120
Float_t GetValue(UInt_t ivar) const
return value of i'th variable
Definition: Event.cxx:231
MsgLogger & Log() const
Definition: Configurable.h:130
UInt_t GetNVariables() const
access the number of variables through the datasetinfo
Definition: DataSet.cxx:200
UInt_t GetClass() const
Definition: Event.h:86
const TString & Color(const TString &)
human readable color strings
Definition: Tools.cxx:837
ClassImp(MethodPyRandomForest) MethodPyRandomForest
#define REGISTER_METHOD(CLASS)
for example
static PyObject * fPickleLoads
Definition: PyMethodBase.h:124
MethodPyRandomForest(const TString &jobName, const TString &methodTitle, DataSetInfo &theData, const TString &theOption="", TDirectory *theTargetDir=NULL)
static PyObject * fPickleDumps
Definition: PyMethodBase.h:123
virtual void DeclareCompatibilityOptions()
options that are used ONLY for the READER to ensure backward compatibility they are hence without any...
Definition: MethodBase.cxx:606
void SetWeightFileDir(TString fileDir)
set directory of weight file
virtual void TestClassification()
initialization
Long64_t GetNTrainingEvents() const
Definition: DataSet.h:90
double result[121]
const Bool_t kTRUE
Definition: Rtypes.h:91
virtual void TestClassification()
initialization
_object PyObject
Definition: TPyArg.h:22
void NoErrorCalc(Double_t *const err, Double_t *const errUpper)
Definition: MethodBase.cxx:827