doc/v614/Architectures_2Reference_2TensorDataLoader_8h_source.html

 // @(#)root/tmva/tmva/dnn:$Id$
 // Author: Vladimir Ilievski

 /**********************************************************************************
  * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *
  * Package: TMVA                                                                  *
  * Class  : TTensorDataLoader                                                     *
  * Web    : http://tmva.sourceforge.net                                           *
  *                                                                                *
  * Description:                                                                   *
  *      Specialization of the Tensor Data Loader Class                            *
  *                                                                                *
  * Authors (alphabetical):                                                        *
  *      Vladimir Ilievski      <ilievski.vladimir@live.com>  - CERN, Switzerland  *
  *                                                                                *
  * Copyright (c) 2005-2015:                                                       *
  *      CERN, Switzerland                                                         *
  *      U. of Victoria, Canada                                                    *
  *      MPI-K Heidelberg, Germany                                                 *
  *      U. of Bonn, Germany                                                       *
  *                                                                                *
  * Redistribution and use in source and binary forms, with or without             *
  * modification, are permitted according to the terms listed in LICENSE           *
  * (http://tmva.sourceforge.net/LICENSE)                                          *
  **********************************************************************************/

 //////////////////////////////////////////////////////////////////////////
 // Partial specialization of the TTensorDataLoader class to adapt       //
 // it to the TMatrix class. Also the data transfer is kept simple,      //
 // since this implementation (being intended as reference and fallback) //
 // is not optimized for performance.                                    //
 //////////////////////////////////////////////////////////////////////////

 #ifndef TMVA_DNN_ARCHITECTURES_REFERENCE_TENSORDATALOADER
 #define TMVA_DNN_ARCHITECTURES_REFERENCE_TENSORDATALOADER

 #include "TMVA/DNN/TensorDataLoader.h"
 #include <iostream>

 namespace TMVA {
 namespace DNN {

 /// Forward declaration of the reference architecture class template. It is
 /// only needed here as the tag type that selects the TTensorDataLoader
 /// partial specialization declared below.
 template <typename AReal>
 class TReference;

 /** Partial specialization of TTensorDataLoader for the TReference architecture.
  *
  *  The loader keeps a reference to the user data together with one reusable set
  *  of TMatrixT buffers (input tensor, output matrix, weight matrix). Every call
  *  to GetTensorBatch() refills those buffers through the CopyTensor* functions
  *  and hands them to a TTensorBatch.
  *
  *  \tparam AData Type of the data set the batches are read from.
  *  \tparam AReal Scalar type of the matrices (element type of TMatrixT).
  */
 template <typename AData, typename AReal>
 class TTensorDataLoader<AData, TReference<AReal>> {
 private:
    using BatchIterator_t = TTensorBatchIterator<AData, TReference<AReal>>;

    // Held by reference: the loader does not own the data, so the referenced
    // object must stay alive for as long as the loader is used.
    const AData &fData; ///< The data that should be loaded in the batches.

    size_t fNSamples;        ///< The total number of samples in the dataset.
    size_t fBatchSize;       ///< The size of a batch.
    size_t fBatchDepth;      ///< The number of matrices in the tensor.
    size_t fBatchHeight;     ///< The number of rows in each matrix.
    size_t fBatchWidth;      ///< The number of columns in each matrix.
    size_t fNOutputFeatures; ///< The number of outputs from the classifier/regressor.
    size_t fBatchIndex;      ///< Index of the next batch served by GetTensorBatch(); wraps around.

    std::vector<TMatrixT<AReal>> inputTensor; ///< The 3D tensor used to keep the input data.
    TMatrixT<AReal> outputMatrix;             ///< The matrix used to keep the output.
    TMatrixT<AReal> weightMatrix;             ///< The matrix used to keep the batch weights.

    std::vector<size_t> fSampleIndices; ///< Ordering of the samples in the epoch.

 public:
    /*! Constructor.
     *  Stores the batch geometry, allocates the batch buffers and initializes
     *  the sample ordering to 0, 1, ..., nSamples - 1. The nStreams argument is
     *  accepted but not used by this specialization. */
    TTensorDataLoader(const AData &data, size_t nSamples, size_t batchSize, size_t batchDepth, size_t batchHeight,
                      size_t batchWidth, size_t nOutputFeatures, size_t nStreams = 1);

    // NOTE(review): the class has a reference member (fData), so the defaulted
    // assignment operators below are implicitly defined as deleted; only the
    // copy/move constructors are actually usable.
    TTensorDataLoader(const TTensorDataLoader &) = default;
    TTensorDataLoader(TTensorDataLoader &&) = default;
    TTensorDataLoader &operator=(const TTensorDataLoader &) = default;
    TTensorDataLoader &operator=(TTensorDataLoader &&) = default;

    /** Copy the input data of the samples starting at \p sampleIterator into
     *  the given tensor. Only declared here; to be specialized by the
     *  architecture-specific backend. */
    void CopyTensorInput(std::vector<TMatrixT<AReal>> &tensor, IndexIterator_t sampleIterator);
    /** Copy the output (target) values of the samples starting at
     *  \p sampleIterator into the given matrix. Only declared here; to be
     *  specialized by the architecture-specific backend. */
    void CopyTensorOutput(TMatrixT<AReal> &matrix, IndexIterator_t sampleIterator);
    /** Copy the weights of the samples starting at \p sampleIterator into the
     *  given matrix. Only declared here; to be specialized by the
     *  architecture-specific backend. */
    void CopyTensorWeights(TMatrixT<AReal> &matrix, IndexIterator_t sampleIterator);

    /** Iterator to the first batch. */
    BatchIterator_t begin() { return BatchIterator_t(*this); }
    /** Iterator one past the last batch. The batch count is the integer
     *  quotient fNSamples / fBatchSize, so it counts complete batches only. */
    BatchIterator_t end() { return BatchIterator_t(*this, fNSamples / fBatchSize); }

    /** Shuffle the order of the samples in the batch. The shuffling is indirect,
     *  i.e. only the indices are shuffled. No input data is moved by this
     *  routine. */
    template<typename RNG>
    void Shuffle(RNG & rng);

    /** Return the next batch from the training set. The TTensorDataLoader object
     *  keeps an internal counter that cycles over the batches in the training
     *  set. */
    TTensorBatch<TReference<AReal>> GetTensorBatch();
 };

 //
 // TTensorDataLoader Class.
 //______________________________________________________________________________
 /// Build a loader over \p data.
 ///
 /// \param data            Data set the batches are read from (stored by reference).
 /// \param nSamples        Total number of samples in the data set.
 /// \param batchSize       Number of samples per batch.
 /// \param batchDepth      Number of matrices in the input tensor.
 /// \param batchHeight     Number of rows of each input matrix.
 /// \param batchWidth      Number of columns of each input matrix.
 /// \param nOutputFeatures Number of columns of the output matrix.
 ///
 /// The last (unnamed) argument, nStreams, is ignored by this specialization.
 template <typename AData, typename AReal>
 TTensorDataLoader<AData, TReference<AReal>>::TTensorDataLoader(const AData &data, size_t nSamples, size_t batchSize,
                                                                size_t batchDepth, size_t batchHeight, size_t batchWidth,
                                                                size_t nOutputFeatures, size_t /* nStreams */)
    : fData(data),
      fNSamples(nSamples),
      fBatchSize(batchSize),
      fBatchDepth(batchDepth),
      fBatchHeight(batchHeight),
      fBatchWidth(batchWidth),
      fNOutputFeatures(nOutputFeatures),
      fBatchIndex(0),
      inputTensor(),
      outputMatrix(batchSize, nOutputFeatures),
      weightMatrix(batchSize, 1),
      fSampleIndices()
 {
    // One (height x width) matrix per depth slice of the input tensor.
    inputTensor.reserve(fBatchDepth);
    while (inputTensor.size() < fBatchDepth) {
       inputTensor.emplace_back(fBatchHeight, fBatchWidth);
    }

    // Start from the identity ordering 0, 1, ..., fNSamples - 1.
    fSampleIndices.resize(fNSamples);
    size_t nextIndex = 0;
    for (auto &sampleIndex : fSampleIndices) {
       sampleIndex = nextIndex++;
    }
 }

 /// Randomly permute the sample ordering using \p rng as the random source.
 /// Only the index vector is reordered; the underlying data is not touched.
 template <typename AData, typename AReal>
 template <typename RNG>
 void TTensorDataLoader<AData, TReference<AReal>>::Shuffle(RNG & rng)
 {
    auto firstIndex = fSampleIndices.begin();
    auto lastIndex = fSampleIndices.end();
    std::shuffle(firstIndex, lastIndex, rng);
 }

 /// Fill the internal buffers with the next batch and return it.
 ///
 /// The batch counter wraps around after fNSamples / fBatchSize batches.
 /// Precondition: that quotient must be non-zero (fBatchSize > 0 and
 /// fNSamples >= fBatchSize); otherwise the modulo below is undefined.
 template <typename AData, typename AReal>
 auto TTensorDataLoader<AData, TReference<AReal>>::GetTensorBatch() -> TTensorBatch<TReference<AReal>>
 {
    // Number of complete batches; the counter cycles within [0, nBatches).
    const size_t nBatches = fNSamples / fBatchSize;
    fBatchIndex = fBatchIndex % nBatches;

    // Position in the sample ordering where the current batch begins.
    const size_t firstSample = fBatchIndex * fBatchSize;
    IndexIterator_t batchStart = fSampleIndices.begin() + firstSample;

    CopyTensorInput(inputTensor, batchStart);
    CopyTensorOutput(outputMatrix, batchStart);
    CopyTensorWeights(weightMatrix, batchStart);

    ++fBatchIndex;
    return TTensorBatch<TReference<AReal>>(inputTensor, outputMatrix, weightMatrix);
 }

 } // namespace DNN
 } // namespace TMVA

 #endif
ApplicationClassificationKeras.data
data
Definition: ApplicationClassificationKeras.py:17

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::weightMatrix
TMatrixT< AReal > weightMatrix
The matrix used to keep the batch weights.
Definition: TensorDataLoader.h:63

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fSampleIndices
std::vector< size_t > fSampleIndices
Ordering of the samples in the epoch.
Definition: TensorDataLoader.h:65

TMVA::DNN::TTensorDataLoader::CopyTensorInput
void CopyTensorInput(HostBuffer_t &buffer, IndexIterator_t begin)
Copy input tensor into the given host buffer.

TMVA::DNN::TTensorBatchIterator
TTensorBatchIterator.
Definition: TensorDataLoader.h:93

TMVA::DNN::TTensorDataLoader
TTensorDataLoader.
Definition: TensorDataLoader.h:82

TMatrixT< AReal >

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::end
BatchIterator_t end()
Definition: TensorDataLoader.h:88

TMVA::DNN::TReference
The reference architecture class.
Definition: DataLoader.h:30

TMVA::DNN::TTensorDataLoader::GetTensorBatch
TTensorBatch< Architecture_t > GetTensorBatch()
Return the next batch from the training set.
Definition: TensorDataLoader.h:227

TMVA::DNN::TTensorDataLoader::fBatchHeight
size_t fBatchHeight
The number of rows in each matrix.
Definition: TensorDataLoader.h:142

TMVA::DNN::IndexIterator_t
typename std::vector< size_t >::iterator IndexIterator_t
Definition: DataLoader.h:42

TMVA::DNN::TTensorDataLoader::fBatchIndex
size_t fBatchIndex
The index of the batch when there are multiple batches in parallel.
Definition: TensorDataLoader.h:145

TMVA::DNN::TTensorDataLoader::CopyTensorWeights
void CopyTensorWeights(HostBuffer_t &buffer, IndexIterator_t begin)
Copy weight matrix into the given host buffer.

TMVA::DNN::TTensorDataLoader::TTensorDataLoader
TTensorDataLoader(const Data_t &data, size_t nSamples, size_t batchSize, size_t batchDepth, size_t batchHeight, size_t batchWidth, size_t nOutputFeatures, size_t nStreams=1)
Constructor.
Definition: TensorDataLoader.h:203

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchWidth
size_t fBatchWidth
The number of columns in each matrix.
Definition: TensorDataLoader.h:57

TMVA::DNN::TTensorDataLoader::CopyTensorOutput
void CopyTensorOutput(HostBuffer_t &buffer, IndexIterator_t begin)
Copy output matrix into the given host buffer.

TMVA::DNN::TTensorBatch
TTensorBatch.
Definition: TensorDataLoader.h:57

TMVA::DNN::TTensorDataLoader::fBatchDepth
size_t fBatchDepth
The number of matrices in the tensor.
Definition: TensorDataLoader.h:141

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchSize
size_t fBatchSize
The size of a batch.
Definition: TensorDataLoader.h:54

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchIndex
size_t fBatchIndex
The index of the batch when there are multiple batches in parallel.
Definition: TensorDataLoader.h:59

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fNOutputFeatures
size_t fNOutputFeatures
The number of outputs from the classifier/regressor.
Definition: TensorDataLoader.h:58

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::outputMatrix
TMatrixT< AReal > outputMatrix
The matrix used to keep the output.
Definition: TensorDataLoader.h:62

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fData
const AData & fData
The data that should be loaded in the batches.
Definition: TensorDataLoader.h:51

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::begin
BatchIterator_t begin()
Definition: TensorDataLoader.h:87

TMVA::DNN::TTensorDataLoader::Shuffle
void Shuffle(RNG &rng)
Shuffle the order of the samples in the batch.
Definition: TensorDataLoader.h:276

TMVA::DNN::TTensorDataLoader::operator=
TTensorDataLoader & operator=(const TTensorDataLoader &)=default

TMVA::DNN::TTensorDataLoader::BatchIterator_t
TTensorBatchIterator< Data_t, Architecture_t > BatchIterator_t
Definition: TensorDataLoader.h:135

TensorDataLoader.h

TMVA
Abstract ClassifierFactory template that handles arbitrary types.
Definition: GeneticMinimizer.h:21

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fNSamples
size_t fNSamples
The total number of samples in the dataset.
Definition: TensorDataLoader.h:53

TMVA::DNN::TTensorDataLoader::fNSamples
size_t fNSamples
The total number of samples in the dataset.
Definition: TensorDataLoader.h:139

TMVA::DNN::TTensorDataLoader::fBatchWidth
size_t fBatchWidth
The number of columns in each matrix.
Definition: TensorDataLoader.h:143

TMVA::DNN::TTensorDataLoader::fBatchSize
size_t fBatchSize
The size of a batch.
Definition: TensorDataLoader.h:140

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchDepth
size_t fBatchDepth
The number of matrices in the tensor.
Definition: TensorDataLoader.h:55

TMVA::DNN::TTensorDataLoader::fData
const Data_t & fData
The data that should be loaded in the batches.
Definition: TensorDataLoader.h:137

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchHeight
size_t fBatchHeight
The number of rows in each matrix.
Definition: TensorDataLoader.h:56

TMVA::DNN::TTensorDataLoader::fNOutputFeatures
size_t fNOutputFeatures
The number of outputs from the classifier/regressor.
Definition: TensorDataLoader.h:144

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::inputTensor
std::vector< TMatrixT< AReal > > inputTensor
The 3D tensor used to keep the input data.
Definition: TensorDataLoader.h:61

TMVA::DNN::TTensorDataLoader::fSampleIndices
std::vector< size_t > fSampleIndices
Ordering of the samples in the epoch.
Definition: TensorDataLoader.h:151