doc/v618/TensorDataLoader_8h_source.html

// @(#)root/tmva/tmva/dnn:$Id$

// Author: Vladimir Ilievski


/**********************************************************************************

 * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

 * Package: TMVA                                                                  *

 * Class  : TTensorDataLoader                                                     *

 * Web    : http://tmva.sourceforge.net                                           *

 *                                                                                *

 * Description:                                                                   *

 *      Tensor Data Loader Class                                                  *

 *                                                                                *

 * Authors (alphabetical):                                                        *

 *      Vladimir Ilievski      <ilievski.vladimir@live.com>  - CERN, Switzerland  *

 *                                                                                *

 * Copyright (c) 2005-2015:                                                       *

 *      CERN, Switzerland                                                         *

 *      U. of Victoria, Canada                                                    *

 *      MPI-K Heidelberg, Germany                                                 *

 *      U. of Bonn, Germany                                                       *

 *                                                                                *

 * Redistribution and use in source and binary forms, with or without             *

 * modification, are permitted according to the terms listed in LICENSE           *

 * (http://tmva.sourceforge.net/LICENSE)                                          *

 **********************************************************************************/


#ifndef TMVA_DNN_TENSORDATALOADER

#define TMVA_DNN_TENSORDATALOADER


#include "TMatrix.h"

#include "TMVA/Event.h"

#include <algorithm>


namespace TMVA {

   class DataSetInfo;

namespace DNN {


//

// Input Data Types

//______________________________________________________________________________

/// Tensor-style input: a tuple of const references to a vector of matrices and
/// two further matrices.
/// NOTE(review): presumably (inputs, outputs, weights), mirroring TTensorBatch —
/// confirm against the CopyTensor* specializations.
using TensorInput = std::tuple<const std::vector<TMatrixT<Double_t>> &,
                               const TMatrixT<Double_t> &,
                               const TMatrixT<Double_t> &>;

/// TMVA-style input: a tuple of const references to an event list and its DataSetInfo.
using TMVAInput_t = std::tuple<const std::vector<Event *> &, const DataSetInfo &>;

/// Iterator into a vector of sample indices; used to mark where a batch starts.
using IndexIterator_t = std::vector<size_t>::iterator;


/** TTensorBatch
 *
 * A single training batch: a vector of input matrices together with one
 * output matrix and one weight matrix. All three parts are held by value and
 * are exposed through GetInput(), GetOutput() and GetWeights().
 *
 * \tparam Architecture_t The underlying architecture; it supplies Matrix_t.
 */
template <typename Architecture_t>
class TTensorBatch {
public:
   using Matrix_t = typename Architecture_t::Matrix_t;

   /** Build a batch from an input tensor, an output matrix and a weight matrix
    *  (in that order). */
   TTensorBatch(std::vector<Matrix_t> &, Matrix_t &, Matrix_t &);

   // Copy and move operations are the compiler-generated ones.
   TTensorBatch(const TTensorBatch &) = default;
   TTensorBatch(TTensorBatch &&) = default;
   TTensorBatch &operator=(const TTensorBatch &) = default;
   TTensorBatch &operator=(TTensorBatch &&) = default;

   /** Mutable access to the input tensor (one matrix per entry). */
   std::vector<Matrix_t> &GetInput() { return fInputTensor; }

   /** Mutable access to the output matrix. */
   Matrix_t &GetOutput() { return fOutputMatrix; }

   /** Mutable access to the matrix holding the event weights. */
   Matrix_t &GetWeights() { return fWeightMatrix; }

private:
   // Declaration order is kept as fInputTensor, fOutputMatrix, fWeightMatrix so
   // that member initialization order is unchanged.
   std::vector<Matrix_t> fInputTensor; ///< The input tensor batch, one matrix per input.
   Matrix_t fOutputMatrix;             ///< The output matrix representing the ground truth.
   Matrix_t fWeightMatrix;             ///< The matrix holding the event weights.
};


template <typename Data_t, typename Architecture_t>

class TTensorDataLoader;


/** TTensorBatchIterator
 *
 * Minimal iterator over the training batches of a TTensorDataLoader, providing
 * just the operations a range-based for loop needs (dereference,
 * pre-increment, inequality).
 *
 * The iterator's own index is used only for comparison against the end
 * iterator. Dereferencing does not look at it: it asks the loader for its next
 * batch, so the batch that is returned is determined by the loader's internal
 * counter.
 *
 * \tparam Data_t         The input data type.
 * \tparam Architecture_t The underlying architecture type.
 */
template <typename Data_t, typename Architecture_t>
class TTensorBatchIterator {
private:
   TTensorDataLoader<Data_t, Architecture_t> &fTensorDataLoader; ///< Loader that produces the batches.
   size_t fBatchIndex;                                           ///< Position of this iterator, used for comparison only.

public:
   /** Create an iterator over \p tensorDataLoader positioned at batch \p index. */
   TTensorBatchIterator(TTensorDataLoader<Data_t, Architecture_t> &tensorDataLoader, size_t index = 0)
      : fTensorDataLoader(tensorDataLoader), fBatchIndex(index)
   {
      // Nothing to do here.
   }

   /** Fetch the loader's next batch. Const-qualified so that const iterators can
    *  be dereferenced; the loader is reached through a reference member, so the
    *  call still advances the loader's internal state. */
   TTensorBatch<Architecture_t> operator*() const { return fTensorDataLoader.GetTensorBatch(); }

   /** Pre-increment: advance the position and return this iterator by reference
    *  (the canonical form; avoids copying the iterator on every step). */
   TTensorBatchIterator &operator++()
   {
      ++fBatchIndex;
      return *this;
   }

   /** Two iterators differ when their positions differ. The loader they refer
    *  to is not part of the comparison. */
   bool operator!=(const TTensorBatchIterator &other) const { return fBatchIndex != other.fBatchIndex; }
};


/** TTensorDataLoader
 *
 * Service class managing the streaming of the training data from the input data
 * type to the accelerator device or the CPU. A TTensorDataLoader object owns
 * fNStreams pairs of host and device buffers, which are used in a round-robin
 * manner for the transfer of batches to the device.
 *
 * Each TTensorDataLoader object has an associated batch size and a total number
 * of samples in the dataset. begin() and end() allow the user to iterate over
 * the batches of one epoch, i.e. over fNSamples / fBatchSize batches.
 *
 * \tparam Data_t The input data type.
 * \tparam Architecture_t The architecture class of the underlying architecture.
 */
template <typename Data_t, typename Architecture_t>
class TTensorDataLoader {
private:
   using HostBuffer_t = typename Architecture_t::HostBuffer_t;
   using DeviceBuffer_t = typename Architecture_t::DeviceBuffer_t;
   using Matrix_t = typename Architecture_t::Matrix_t;
   using BatchIterator_t = TTensorBatchIterator<Data_t, Architecture_t>;

   const Data_t &fData; ///< The data that should be loaded in the batches (held by reference, not owned).

   size_t fNSamples;        ///< The total number of samples in the dataset.
   size_t fBatchSize;       ///< The size of a batch.
   size_t fBatchDepth;      ///< The number of matrices in the tensor.
   size_t fBatchHeight;     ///< The number of rows in each matrix.
   size_t fBatchWidth;      ///< The number of columns in each matrix.
   size_t fNOutputFeatures; ///< The number of outputs from the classifier/regressor.
   size_t fBatchIndex;      ///< Index of the next batch handed out by GetTensorBatch().

   size_t fNStreams;                           ///< Number of buffer pairs.
   std::vector<DeviceBuffer_t> fDeviceBuffers; ///< The device buffers used to keep the input, output and weight data.
   std::vector<HostBuffer_t> fHostBuffers;     ///< The host buffers used to load the input, output and weight data.

   std::vector<size_t> fSampleIndices; ///< Ordering of the samples in the epoch.

public:
   /*! Constructor. Allocates \p nStreams host/device buffer pairs and sets up
    *  the sample ordering 0 .. nSamples-1. */
   TTensorDataLoader(const Data_t &data, size_t nSamples, size_t batchSize, size_t batchDepth, size_t batchHeight,
                     size_t batchWidth, size_t nOutputFeatures, size_t nStreams = 1);

   TTensorDataLoader(const TTensorDataLoader &) = default;
   TTensorDataLoader(TTensorDataLoader &&) = default;
   // Note: fData is a reference member, so these defaulted assignment operators
   // are defined as deleted by the language rules.
   TTensorDataLoader &operator=(const TTensorDataLoader &) = default;
   TTensorDataLoader &operator=(TTensorDataLoader &&) = default;

   /** Copy input tensor into the given host buffer, starting at the sample
    *  index pointed to by \p begin. Function to be specialized by the
    *  architecture-specific backend. */
   void CopyTensorInput(HostBuffer_t &buffer, IndexIterator_t begin);

   /** Copy output matrix into the given host buffer, starting at the sample
    *  index pointed to by \p begin. Function to be specialized by the
    *  architecture-specific backend. */
   void CopyTensorOutput(HostBuffer_t &buffer, IndexIterator_t begin);

   /** Copy weight matrix into the given host buffer, starting at the sample
    *  index pointed to by \p begin. Function to be specialized by the
    *  architecture-specific backend. */
   void CopyTensorWeights(HostBuffer_t &buffer, IndexIterator_t begin);

   /** Iterator positioned at the first batch of the epoch. */
   BatchIterator_t begin() { return BatchIterator_t(*this); }

   /** Iterator positioned one past the last batch. The batch count is
    *  fNSamples / fBatchSize (integer division), so trailing samples that do
    *  not fill a complete batch are not visited. */
   BatchIterator_t end() { return BatchIterator_t(*this, fNSamples / fBatchSize); }

   /** Shuffle the order of the samples in the batch. The shuffling is indirect,
    *  i.e. only the indices are shuffled. No input data is moved by this
    *  routine. */
   template <typename RNG>
   void Shuffle(RNG &rng);

   /** Return the next batch from the training set. The TTensorDataLoader object
    *  keeps an internal counter that cycles over the batches in the training
    *  set. */
   TTensorBatch<Architecture_t> GetTensorBatch();
};


//

// TTensorBatch Class.

//______________________________________________________________________________

/** Construct a batch by copying the given input tensor, output matrix and
 *  weight matrix into the corresponding members. */
template <typename Architecture_t>
TTensorBatch<Architecture_t>::TTensorBatch(std::vector<Matrix_t> &inputTensor,
                                           Matrix_t &outputMatrix,
                                           Matrix_t &weightMatrix)
   : fInputTensor(inputTensor),
     fOutputMatrix(outputMatrix),
     fWeightMatrix(weightMatrix)
{
   // All work is done in the member initializer list.
}


//

// TTensorDataLoader Class.

//______________________________________________________________________________

/** Set up a loader over \p data.
 *
 * Stores the batch geometry, allocates \p nStreams host/device buffer pairs and
 * initializes the sample ordering to 0, 1, ..., nSamples-1. Every buffer is
 * sized to hold the input tensor, the output matrix and the weights of one
 * batch back to back.
 */
template <typename Data_t, typename Architecture_t>
TTensorDataLoader<Data_t, Architecture_t>::TTensorDataLoader(const Data_t &data, size_t nSamples, size_t batchSize,
                                                             size_t batchDepth, size_t batchHeight, size_t batchWidth,
                                                             size_t nOutputFeatures, size_t nStreams)
   : fData(data),
     fNSamples(nSamples),
     fBatchSize(batchSize),
     fBatchDepth(batchDepth),
     fBatchHeight(batchHeight),
     fBatchWidth(batchWidth),
     fNOutputFeatures(nOutputFeatures),
     fBatchIndex(0),
     fNStreams(nStreams),
     fDeviceBuffers(),
     fHostBuffers(),
     fSampleIndices()
{
   // Number of elements of one batch: input tensor + output matrix + weights.
   const size_t inputElements = fBatchDepth * fBatchHeight * fBatchWidth;
   const size_t outputElements = fBatchSize * fNOutputFeatures;
   const size_t weightElements = fBatchSize;
   const size_t bufferElements = inputElements + outputElements + weightElements;

   // One host/device buffer pair per stream.
   for (size_t stream = 0; stream != fNStreams; ++stream) {
      fHostBuffers.push_back(HostBuffer_t(bufferElements));
      fDeviceBuffers.push_back(DeviceBuffer_t(bufferElements));
   }

   // Identity ordering of the samples; Shuffle() permutes it later.
   fSampleIndices.resize(fNSamples);
   size_t nextIndex = 0;
   for (size_t &sampleIndex : fSampleIndices) {
      sampleIndex = nextIndex;
      ++nextIndex;
   }
}


//______________________________________________________________________________

/** Assemble the next batch and advance the internal batch counter.
 *
 * The batch index wraps around after fNSamples / fBatchSize batches. The buffer
 * pair is selected round-robin as batch index modulo fNStreams. Input, output
 * and weights are copied into consecutive regions of the host buffer, the host
 * buffer is copied to the device buffer, and the returned matrices are built on
 * top of the corresponding regions of the device buffer.
 *
 * Preconditions implied by the arithmetic below: fNSamples >= fBatchSize > 0 and
 * fNStreams > 0 (otherwise a division or modulo by zero occurs).
 *
 * \return The batch holding fBatchDepth input matrices of shape
 *         fBatchHeight x fBatchWidth, an fBatchSize x fNOutputFeatures output
 *         matrix and an fBatchSize x 1 weight matrix.
 */
template <typename Data_t, typename Architecture_t>
TTensorBatch<Architecture_t> TTensorDataLoader<Data_t, Architecture_t>::GetTensorBatch()
{
   fBatchIndex %= (fNSamples / fBatchSize); // Cycle through samples.

   // Layout of one buffer: [ input tensor | output matrix | weights ].
   size_t inputTensorSize = fBatchDepth * fBatchHeight * fBatchWidth;
   size_t outputMatrixSize = fBatchSize * fNOutputFeatures;
   size_t weightMatrixSize = fBatchSize;

   // Pick the buffer pair for this batch in a round-robin manner.
   size_t streamIndex = fBatchIndex % fNStreams;
   HostBuffer_t &hostBuffer = fHostBuffers[streamIndex];
   DeviceBuffer_t &deviceBuffer = fDeviceBuffers[streamIndex];

   // The sub-buffers are expected to alias the parent storage: the data written
   // through them below is transferred by copying the parent host buffer.
   HostBuffer_t inputHostBuffer = hostBuffer.GetSubBuffer(0, inputTensorSize);
   HostBuffer_t outputHostBuffer = hostBuffer.GetSubBuffer(inputTensorSize, outputMatrixSize);
   HostBuffer_t weightHostBuffer = hostBuffer.GetSubBuffer(inputTensorSize + outputMatrixSize, weightMatrixSize);

   DeviceBuffer_t inputDeviceBuffer = deviceBuffer.GetSubBuffer(0, inputTensorSize);
   DeviceBuffer_t outputDeviceBuffer = deviceBuffer.GetSubBuffer(inputTensorSize, outputMatrixSize);
   DeviceBuffer_t weightDeviceBuffer = deviceBuffer.GetSubBuffer(inputTensorSize + outputMatrixSize, weightMatrixSize);

   // The sample index advances by the batch size per batch, whereas
   // CopyTensorInput works in units of the batch depth. Two layouts are
   // therefore supported:
   //   - batch depth == 1 and batch height == batch size, or
   //   - batch depth == batch size.
   size_t sampleIndex = fBatchIndex * fBatchSize;
   IndexIterator_t sampleIndexIterator = fSampleIndices.begin() + sampleIndex;

   CopyTensorInput(inputHostBuffer, sampleIndexIterator);
   CopyTensorOutput(outputHostBuffer, sampleIndexIterator);
   CopyTensorWeights(weightHostBuffer, sampleIndexIterator);

   deviceBuffer.CopyFrom(hostBuffer);

   // Wrap each fBatchHeight x fBatchWidth slice of the input region in a matrix.
   std::vector<Matrix_t> inputTensor;
   inputTensor.reserve(fBatchDepth);
   size_t jump = fBatchHeight * fBatchWidth;
   for (size_t i = 0; i < fBatchDepth; i++) {
      DeviceBuffer_t subInputDeviceBuffer = inputDeviceBuffer.GetSubBuffer(i * jump, jump);
      inputTensor.emplace_back(subInputDeviceBuffer, fBatchHeight, fBatchWidth);
   }

   Matrix_t outputMatrix(outputDeviceBuffer, fBatchSize, fNOutputFeatures);
   // The weight region holds exactly fBatchSize elements (weightMatrixSize), so
   // the matrix over it must be fBatchSize x 1. Declaring it as
   // fBatchSize x fNOutputFeatures would describe more elements than the
   // sub-buffer contains whenever fNOutputFeatures > 1.
   Matrix_t weightMatrix(weightDeviceBuffer, fBatchSize, 1);

   fBatchIndex++;
   return TTensorBatch<Architecture_t>(inputTensor, outputMatrix, weightMatrix);
}


//______________________________________________________________________________

/** Randomly permute the sample ordering using \p rng. Only the index vector is
 *  reordered; the underlying data is not touched. */
template <typename Data_t, typename Architecture_t>
template <typename RNG>
void TTensorDataLoader<Data_t, Architecture_t>::Shuffle(RNG &rng)
{
   auto firstIndex = fSampleIndices.begin();
   auto lastIndex = fSampleIndices.end();
   std::shuffle(firstIndex, lastIndex, rng);
}


} // namespace DNN

} // namespace TMVA


#endif

Event.h

TMatrix.h

TMVA::DNN::TTensorBatchIterator
TTensorBatchIterator.
Definition: TensorDataLoader.h:93

TMVA::DNN::TTensorBatchIterator::fBatchIndex
size_t fBatchIndex
Definition: TensorDataLoader.h:96

TMVA::DNN::TTensorBatchIterator::TTensorBatchIterator
TTensorBatchIterator(TTensorDataLoader< Data_t, Architecture_t > &tensorDataLoader, size_t index=0)
Definition: TensorDataLoader.h:99

TMVA::DNN::TTensorBatchIterator::operator*
TTensorBatch< Architecture_t > operator*()
Definition: TensorDataLoader.h:105

TMVA::DNN::TTensorBatchIterator::operator!=
bool operator!=(const TTensorBatchIterator &other)
Definition: TensorDataLoader.h:111

TMVA::DNN::TTensorBatchIterator::fTensorDataLoader
TTensorDataLoader< Data_t, Architecture_t > & fTensorDataLoader
Definition: TensorDataLoader.h:95

TMVA::DNN::TTensorBatchIterator::operator++
TTensorBatchIterator operator++()
Definition: TensorDataLoader.h:106

TMVA::DNN::TTensorBatch
TTensorBatch.
Definition: TensorDataLoader.h:57

TMVA::DNN::TTensorBatch::GetInput
std::vector< Matrix_t > & GetInput()
Return the tensor representing the input data.
Definition: TensorDataLoader.h:74

TMVA::DNN::TTensorBatch::operator=
TTensorBatch & operator=(const TTensorBatch &)=default

TMVA::DNN::TTensorBatch::TTensorBatch
TTensorBatch(TTensorBatch &&)=default

TMVA::DNN::TTensorBatch::fWeightMatrix
Matrix_t fWeightMatrix
Definition: TensorDataLoader.h:64

TMVA::DNN::TTensorBatch::operator=
TTensorBatch & operator=(TTensorBatch &&)=default

TMVA::DNN::TTensorBatch::GetWeights
Matrix_t & GetWeights()
Return the matrix holding the event weights.
Definition: TensorDataLoader.h:78

TMVA::DNN::TTensorBatch::TTensorBatch
TTensorBatch(std::vector< Matrix_t > &, Matrix_t &, Matrix_t &)
Definition: TensorDataLoader.h:192

TMVA::DNN::TTensorBatch::GetOutput
Matrix_t & GetOutput()
Return the matrix representing the output data.
Definition: TensorDataLoader.h:76

TMVA::DNN::TTensorBatch::TTensorBatch
TTensorBatch(const TTensorBatch &)=default

TMVA::DNN::TTensorBatch::fInputTensor
std::vector< Matrix_t > fInputTensor
The input tensor batch, one matrix one input.
Definition: TensorDataLoader.h:62

TMVA::DNN::TTensorBatch::fOutputMatrix
Matrix_t fOutputMatrix
The output matrix representing the ground truth.
Definition: TensorDataLoader.h:63

TMVA::DNN::TTensorBatch::Matrix_t
typename Architecture_t::Matrix_t Matrix_t
Definition: TensorDataLoader.h:59

TMVA::DNN::TTensorDataLoader
TTensorDataLoader.
Definition: TensorDataLoader.h:130

TMVA::DNN::TTensorDataLoader::TTensorDataLoader
TTensorDataLoader(const TTensorDataLoader &)=default

TMVA::DNN::TTensorDataLoader::Shuffle
void Shuffle(RNG &rng)
Shuffle the order of the samples in the batch.
Definition: TensorDataLoader.h:276

TMVA::DNN::TTensorDataLoader::fNOutputFeatures
size_t fNOutputFeatures
The number of outputs from the classifier/regressor.
Definition: TensorDataLoader.h:144

TMVA::DNN::TTensorDataLoader::fSampleIndices
std::vector< size_t > fSampleIndices
Ordering of the samples in the epoch.
Definition: TensorDataLoader.h:151

TMVA::DNN::TTensorDataLoader::fDeviceBuffers
std::vector< DeviceBuffer_t > fDeviceBuffers
The device buffers used to keep the input, output and weight data.
Definition: TensorDataLoader.h:148

TMVA::DNN::TTensorDataLoader::GetTensorBatch
TTensorBatch< Architecture_t > GetTensorBatch()
Return the next batch from the training set.
Definition: TensorDataLoader.h:227

TMVA::DNN::TTensorDataLoader::operator=
TTensorDataLoader & operator=(const TTensorDataLoader &)=default

TMVA::DNN::TTensorDataLoader::DeviceBuffer_t
typename Architecture_t::DeviceBuffer_t DeviceBuffer_t
Definition: TensorDataLoader.h:133

TMVA::DNN::TTensorDataLoader::fBatchWidth
size_t fBatchWidth
The number of columns in each matrix.
Definition: TensorDataLoader.h:143

TMVA::DNN::TTensorDataLoader::CopyTensorOutput
void CopyTensorOutput(HostBuffer_t &buffer, IndexIterator_t begin)
Copy output matrix into the given host buffer.

TMVA::DNN::TTensorDataLoader::fBatchIndex
size_t fBatchIndex
The index of the batch when there are multiple batches in parallel.
Definition: TensorDataLoader.h:145

TMVA::DNN::TTensorDataLoader::fBatchHeight
size_t fBatchHeight
The number of rows in each matrix.
Definition: TensorDataLoader.h:142

TMVA::DNN::TTensorDataLoader::fHostBuffers
std::vector< HostBuffer_t > fHostBuffers
The host buffers used to load the input, output and weight data.
Definition: TensorDataLoader.h:149

TMVA::DNN::TTensorDataLoader::begin
BatchIterator_t begin()
Definition: TensorDataLoader.h:173

TMVA::DNN::TTensorDataLoader::TTensorDataLoader
TTensorDataLoader(TTensorDataLoader &&)=default

TMVA::DNN::TTensorDataLoader::fBatchSize
size_t fBatchSize
The size of a batch.
Definition: TensorDataLoader.h:140

TMVA::DNN::TTensorDataLoader::CopyTensorWeights
void CopyTensorWeights(HostBuffer_t &buffer, IndexIterator_t begin)
Copy weight matrix into the given host buffer.

TMVA::DNN::TTensorDataLoader::Matrix_t
typename Architecture_t::Matrix_t Matrix_t
Definition: TensorDataLoader.h:134

TMVA::DNN::TTensorDataLoader::HostBuffer_t
typename Architecture_t::HostBuffer_t HostBuffer_t
Definition: TensorDataLoader.h:132

TMVA::DNN::TTensorDataLoader::fBatchDepth
size_t fBatchDepth
The number of matrices in the tensor.
Definition: TensorDataLoader.h:141

TMVA::DNN::TTensorDataLoader::fNStreams
size_t fNStreams
Number of buffer pairs.
Definition: TensorDataLoader.h:147

TMVA::DNN::TTensorDataLoader::fData
const Data_t & fData
The data that should be loaded in the batches.
Definition: TensorDataLoader.h:137

TMVA::DNN::TTensorDataLoader::operator=
TTensorDataLoader & operator=(TTensorDataLoader &&)=default

TMVA::DNN::TTensorDataLoader::end
BatchIterator_t end()
Definition: TensorDataLoader.h:174

TMVA::DNN::TTensorDataLoader::fNSamples
size_t fNSamples
The total number of samples in the dataset.
Definition: TensorDataLoader.h:139

TMVA::DNN::TTensorDataLoader::TTensorDataLoader
TTensorDataLoader(const Data_t &data, size_t nSamples, size_t batchSize, size_t batchDepth, size_t batchHeight, size_t batchWidth, size_t nOutputFeatures, size_t nStreams=1)
Constructor.
Definition: TensorDataLoader.h:203

TMVA::DNN::TTensorDataLoader::CopyTensorInput
void CopyTensorInput(HostBuffer_t &buffer, IndexIterator_t begin)
Copy input tensor into the given host buffer.

TMVA::DataSetInfo
Class that contains all the data information.
Definition: DataSetInfo.h:60

TMatrixT< Double_t >

TMVA::DNN::TensorInput
std::tuple< const std::vector< TMatrixT< Double_t > > &, const TMatrixT< Double_t > &, const TMatrixT< Double_t > & > TensorInput
Definition: TensorDataLoader.h:42

TMVA::DNN::IndexIterator_t
typename std::vector< size_t >::iterator IndexIterator_t
Definition: DataLoader.h:42

TMVA::DNN::TMVAInput_t
std::tuple< const std::vector< Event * > &, const DataSetInfo & > TMVAInput_t
Definition: DataLoader.h:40

TMVA
create variable transformations
Definition: GeneticMinimizer.h:21