Logo ROOT  
Reference Guide
 
Loading...
Searching...
No Matches
ROOT::Experimental::Internal::ML::RDatasetLoader< Args > Class Template Reference

template<typename... Args>
class ROOT::Experimental::Internal::ML::RDatasetLoader< Args >

Load the whole dataset into memory.

In this class the whole dataset is loaded into memory. The dataset is then shuffled and split into training and validation sets according to the user-defined validation split fraction.

Definition at line 102 of file RDatasetLoader.hxx.

Public Member Functions

 RDatasetLoader (const std::vector< ROOT::RDF::RNode > &rdfs, const float validationSplit, const std::vector< std::string > &cols, const std::vector< std::size_t > &vecSizes={}, const float vecPadding=0.0, bool shuffle=true, const std::size_t setSeed=0)
 
void ConcatenateDatasets ()
 Concatenate the datasets into a single dataset.
 
std::size_t GetNumTrainingEntries ()
 
std::size_t GetNumValidationEntries ()
 
RFlat2DMatrix GetTrainingDataset ()
 
std::vector< RFlat2DMatrix > GetTrainingDatasets ()
 
RFlat2DMatrix GetValidationDataset ()
 
std::vector< RFlat2DMatrix > GetValidationDatasets ()
 
void SplitDataframe (ROOT::RDF::RNode &rdf, RFlat2DMatrix &TrainingDataset, RFlat2DMatrix &ValidationDataset)
 Split an individual dataframe into a training and validation dataset.
 
void SplitDatasets ()
 Split the dataframes into a training and validation dataset.
 

Private Attributes

std::vector< ROOT::RDF::RNode > f_rdfs
 
std::vector< std::string > fCols
 
ROOT::RDF::RResultPtr< std::vector< ULong64_t > > fEntries
 
bool fNotFiltered
 
std::size_t fNumCols
 
std::size_t fNumDatasetCols
 
std::size_t fNumEntries
 
std::size_t fNumTrainingEntries
 
std::size_t fNumValidationEntries
 
std::size_t fSetSeed
 
bool fShuffle
 
std::size_t fSumVecSizes
 
std::unique_ptr< RFlat2DMatrixOperators > fTensorOperators
 
RFlat2DMatrix fTrainingDataset
 
std::vector< RFlat2DMatrix > fTrainingDatasets
 
RFlat2DMatrix fValidationDataset
 
std::vector< RFlat2DMatrix > fValidationDatasets
 
float fValidationSplit
 
std::size_t fVecPadding
 
std::vector< std::size_t > fVecSizes
 

#include <ROOT/ML/RDatasetLoader.hxx>

Constructor & Destructor Documentation

◆ RDatasetLoader()

template<typename... Args>
ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::RDatasetLoader ( const std::vector< ROOT::RDF::RNode > & rdfs,
const float validationSplit,
const std::vector< std::string > & cols,
const std::vector< std::size_t > & vecSizes = {},
const float vecPadding = 0.0,
bool shuffle = true,
const std::size_t setSeed = 0 )
inline

Definition at line 133 of file RDatasetLoader.hxx.

Member Function Documentation

◆ ConcatenateDatasets()

template<typename... Args>
void ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::ConcatenateDatasets ( )
inline

Concatenate the datasets into a single dataset.

Definition at line 220 of file RDatasetLoader.hxx.

◆ GetNumTrainingEntries()

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::GetNumTrainingEntries ( )
inline

Definition at line 232 of file RDatasetLoader.hxx.

◆ GetNumValidationEntries()

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::GetNumValidationEntries ( )
inline

Definition at line 233 of file RDatasetLoader.hxx.

◆ GetTrainingDataset()

template<typename... Args>
RFlat2DMatrix ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::GetTrainingDataset ( )
inline

Definition at line 229 of file RDatasetLoader.hxx.

◆ GetTrainingDatasets()

template<typename... Args>
std::vector< RFlat2DMatrix > ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::GetTrainingDatasets ( )
inline

Definition at line 226 of file RDatasetLoader.hxx.

◆ GetValidationDataset()

template<typename... Args>
RFlat2DMatrix ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::GetValidationDataset ( )
inline

Definition at line 230 of file RDatasetLoader.hxx.

◆ GetValidationDatasets()

template<typename... Args>
std::vector< RFlat2DMatrix > ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::GetValidationDatasets ( )
inline

Definition at line 227 of file RDatasetLoader.hxx.

◆ SplitDataframe()

template<typename... Args>
void ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::SplitDataframe ( ROOT::RDF::RNode & rdf,
RFlat2DMatrix & TrainingDataset,
RFlat2DMatrix & ValidationDataset )
inline

Split an individual dataframe into a training and validation dataset.

Parameters
[in] rdf: Dataframe that will be split into training and validation
[in] TrainingDataset: Tensor for the training dataset
[in] ValidationDataset: Tensor for the validation dataset

Definition at line 156 of file RDatasetLoader.hxx.

◆ SplitDatasets()

template<typename... Args>
void ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::SplitDatasets ( )
inline

Split the dataframes into a training and validation dataset.

Definition at line 198 of file RDatasetLoader.hxx.

Member Data Documentation

◆ f_rdfs

template<typename... Args>
std::vector<ROOT::RDF::RNode> ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::f_rdfs
private

Definition at line 122 of file RDatasetLoader.hxx.

◆ fCols

template<typename... Args>
std::vector<std::string> ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fCols
private

Definition at line 123 of file RDatasetLoader.hxx.

◆ fEntries

template<typename... Args>
ROOT::RDF::RResultPtr<std::vector<ULong64_t> > ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fEntries
private

Definition at line 130 of file RDatasetLoader.hxx.

◆ fNotFiltered

template<typename... Args>
bool ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fNotFiltered
private

Definition at line 127 of file RDatasetLoader.hxx.

◆ fNumCols

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fNumCols
private

Definition at line 124 of file RDatasetLoader.hxx.

◆ fNumDatasetCols

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fNumDatasetCols
private

Definition at line 110 of file RDatasetLoader.hxx.

◆ fNumEntries

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fNumEntries
private

Definition at line 104 of file RDatasetLoader.hxx.

◆ fNumTrainingEntries

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fNumTrainingEntries
private

Definition at line 118 of file RDatasetLoader.hxx.

◆ fNumValidationEntries

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fNumValidationEntries
private

Definition at line 119 of file RDatasetLoader.hxx.

◆ fSetSeed

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fSetSeed
private

Definition at line 125 of file RDatasetLoader.hxx.

◆ fShuffle

template<typename... Args>
bool ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fShuffle
private

Definition at line 128 of file RDatasetLoader.hxx.

◆ fSumVecSizes

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fSumVecSizes
private

Definition at line 108 of file RDatasetLoader.hxx.

◆ fTensorOperators

template<typename... Args>
std::unique_ptr<RFlat2DMatrixOperators> ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fTensorOperators
private

Definition at line 120 of file RDatasetLoader.hxx.

◆ fTrainingDataset

template<typename... Args>
RFlat2DMatrix ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fTrainingDataset
private

Definition at line 115 of file RDatasetLoader.hxx.

◆ fTrainingDatasets

template<typename... Args>
std::vector<RFlat2DMatrix> ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fTrainingDatasets
private

Definition at line 112 of file RDatasetLoader.hxx.

◆ fValidationDataset

template<typename... Args>
RFlat2DMatrix ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fValidationDataset
private

Definition at line 116 of file RDatasetLoader.hxx.

◆ fValidationDatasets

template<typename... Args>
std::vector<RFlat2DMatrix> ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fValidationDatasets
private

Definition at line 113 of file RDatasetLoader.hxx.

◆ fValidationSplit

template<typename... Args>
float ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fValidationSplit
private

Definition at line 105 of file RDatasetLoader.hxx.

◆ fVecPadding

template<typename... Args>
std::size_t ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fVecPadding
private

Definition at line 109 of file RDatasetLoader.hxx.

◆ fVecSizes

template<typename... Args>
std::vector<std::size_t> ROOT::Experimental::Internal::ML::RDatasetLoader< Args >::fVecSizes
private

Definition at line 107 of file RDatasetLoader.hxx.

  • tree/ml/inc/ROOT/ML/RDatasetLoader.hxx