doc/master/Architectures_2Reference_2TensorDataLoader_8h_source.html

// @(#)root/tmva/tmva/dnn:$Id$

// Author: Vladimir Ilievski


/**********************************************************************************

 * Project: TMVA - a Root-integrated toolkit for multivariate data analysis       *

 * Package: TMVA                                                                  *

 * Class  : TTensorDataLoader                                                     *

 *                                             *

 *                                                                                *

 * Description:                                                                   *

 *      Specialization of the Tensor Data Loader Class                            *

 *                                                                                *

 * Authors (alphabetical):                                                        *

 *      Vladimir Ilievski      <ilievski.vladimir@live.com>  - CERN, Switzerland  *

 *                                                                                *

 * Copyright (c) 2005-2015:                                                       *

 *      CERN, Switzerland                                                         *

 *      U. of Victoria, Canada                                                    *

 *      MPI-K Heidelberg, Germany                                                 *

 *      U. of Bonn, Germany                                                       *

 *                                                                                *

 * Redistribution and use in source and binary forms, with or without             *

 * modification, are permitted according to the terms listed in LICENSE           *

 * (see tmva/doc/LICENSE)                                          *

 **********************************************************************************/


//////////////////////////////////////////////////////////////////////////

// Partial specialization of the TTensorDataLoader class to adapt       //

// it to the TMatrix class. Also the data transfer is kept simple,      //

// since this implementation (being intended as reference and fallback) //

// is not optimized for performance.                                    //

//////////////////////////////////////////////////////////////////////////


#ifndef TMVA_DNN_ARCHITECTURES_REFERENCE_TENSORDATALOADER

#define TMVA_DNN_ARCHITECTURES_REFERENCE_TENSORDATALOADER


#include "TMVA/DNN/TensorDataLoader.h"

#include <iostream>


namespace TMVA {

namespace DNN {


/// Forward declaration of the reference architecture class template. Only the
/// name is required in this header, to spell the partial specialization of
/// TTensorDataLoader that follows.
template <typename AReal>

class TReference;


/** Partial specialization of TTensorDataLoader for the TReference<AReal>
 *  architecture.
 *
 *  The loader keeps one staging buffer per batch component (input tensor,
 *  output matrix, weight matrix) as TMatrixT<AReal> value members and refills
 *  them on every call to GetTensorBatch(). Element 0 of the input shape is
 *  used as the number of samples per batch (see end() and GetTensorBatch()).
 *
 *  NOTE(review): fData is a reference member, so the defaulted copy and move
 *  assignment operators declared below are defined as deleted by the language;
 *  only copy/move construction is actually available. */
template <typename AData, typename AReal>

class TTensorDataLoader<AData, TReference<AReal>> {

private:

   using BatchIterator_t = TTensorBatchIterator<AData, TReference<AReal>>;


   const AData &fData;      ///< The data that should be loaded in the batches. Stored as a reference, not a copy.


   size_t fNSamples;        ///< The total number of samples in the dataset.

   //size_t fBatchSize;     ///< The size of a batch.

   size_t fBatchDepth;      ///< The number of matrices in the tensor.

   size_t fBatchHeight;     ///< The number of rows in each matrix.

   size_t fBatchWidth;      ///< The number of columns in each matrix.

   size_t fNOutputFeatures; ///< The number of outputs from the classifier/regressor.

   size_t fBatchIndex;      ///< Index of the next batch handed out by GetTensorBatch(); wrapped modulo the number of complete batches.


   std::vector<size_t> fInputShape;     ///< Defines the batch depth, no. of channels and spatial dimensions of an input tensor. Element 0 is used as the batch size.


   std::vector<TMatrixT<AReal>> inputTensor; ///< The 3D tensor used to keep the input data.

   TMatrixT<AReal> outputMatrix;             ///< The matrix used to keep the output.

   TMatrixT<AReal> weightMatrix;             ///< The matrix used to keep the batch weights.


   std::vector<size_t> fSampleIndices; ///< Ordering of the samples in the epoch.


public:

   /*! Constructor.
    *
    *  \param data            Dataset the batches are read from (kept by reference).
    *  \param nSamples        Total number of samples in \p data.
    *  \param batchDepth      Number of matrices in the input tensor.
    *  \param batchHeight     Number of rows of each input matrix.
    *  \param batchWidth      Number of columns of each input matrix.
    *  \param nOutputFeatures Number of columns of the output matrix.
    *  \param inputShape      Input tensor shape; element 0 is used as the batch size.
    *  \param nStreams        Accepted for interface compatibility; the definition
    *                         in this file does not use it. */

   TTensorDataLoader(const AData &data, size_t nSamples, size_t batchDepth,

                     size_t batchHeight, size_t batchWidth, size_t nOutputFeatures,

                     std::vector<size_t> inputShape, size_t nStreams = 1);


   TTensorDataLoader(const TTensorDataLoader &) = default;

   TTensorDataLoader(TTensorDataLoader &&) = default;

   TTensorDataLoader &operator=(const TTensorDataLoader &) = default;

   TTensorDataLoader &operator=(TTensorDataLoader &&) = default;


   /** Copy input tensor into the given host buffer. Function to be specialized by
    *  the architecture-specific backend.
    *
    *  \param tensor         Destination buffer, one matrix per tensor slice.
    *  \param sampleIterator Position in the sample ordering of the first sample
    *                        of the batch. */

   void CopyTensorInput(std::vector<TMatrixT<AReal>> &tensor, IndexIterator_t sampleIterator);

   /** Copy output matrix into the given host buffer. Function to be specialized
    *  by the architecture-specific backend.
    *
    *  \param matrix         Destination buffer for the batch outputs.
    *  \param sampleIterator Position in the sample ordering of the first sample
    *                        of the batch. */

   void CopyTensorOutput(TMatrixT<AReal> &matrix, IndexIterator_t sampleIterator);

   /** Copy weight matrix into the given host buffer. Function to be specialized
    *  by the architecture-specific backend.
    *
    *  \param matrix         Destination buffer for the batch weights.
    *  \param sampleIterator Position in the sample ordering of the first sample
    *                        of the batch. */

   void CopyTensorWeights(TMatrixT<AReal> &matrix, IndexIterator_t sampleIterator);


   /** Batch iterator constructed from this loader alone. */
   BatchIterator_t begin() { return BatchIterator_t(*this); }

   /** Batch iterator constructed with the number of complete batches,
    *  fNSamples / fInputShape[0] (integer division). */
   BatchIterator_t end() { return BatchIterator_t(*this, fNSamples / fInputShape[0]); }


   /** Shuffle the order of the samples in the batch. The shuffling is indirect,
    *  i.e. only the indices are shuffled. No input data is moved by this
    *  routine.
    *
    *  \param rng Random number generator forwarded to std::shuffle. */

   template<typename RNG>

   void Shuffle(RNG & rng);


   /** Return the next batch from the training set. The TTensorDataLoader object
    *  keeps an internal counter that cycles over the batches in the training
    *  set. */

   TTensorBatch<TReference<AReal>> GetTensorBatch();

};


//

// TTensorDataLoader Class.

//______________________________________________________________________________

/** Construct a tensor data loader for the reference architecture.
 *
 *  Allocates the staging buffers (one batchHeight x batchWidth matrix per
 *  tensor slice, an output matrix and a single-column weight matrix) and sets
 *  the sample ordering to the identity permutation 0 .. nSamples-1.
 *
 *  \param data            Dataset the batches are read from (kept by reference).
 *  \param nSamples        Total number of samples in \p data.
 *  \param batchDepth      Number of matrices in the input tensor.
 *  \param batchHeight     Number of rows of each input matrix.
 *  \param batchWidth      Number of columns of each input matrix.
 *  \param nOutputFeatures Number of columns of the output matrix.
 *  \param inputShape      Input tensor shape; element 0 is used as the batch
 *                         size and therefore as the row count of the output
 *                         and weight matrices. Must not be empty.
 *  The trailing, unnamed parameter (nStreams) is ignored by this implementation.
 */
template <typename AData, typename AReal>
TTensorDataLoader<AData, TReference<AReal>>::TTensorDataLoader(const AData &data, size_t nSamples, size_t batchDepth,
                                                               size_t batchHeight, size_t batchWidth, size_t nOutputFeatures,
                                                               std::vector<size_t> inputShape, size_t /* nStreams */)
   : fData(data), fNSamples(nSamples), fBatchDepth(batchDepth), fBatchHeight(batchHeight),
     fBatchWidth(batchWidth), fNOutputFeatures(nOutputFeatures), fBatchIndex(0), fInputShape(std::move(inputShape)), inputTensor(),
     // Members are initialized in declaration order, so fInputShape has already
     // taken over the contents of the inputShape parameter at this point. The
     // batch size must be read from the member: the moved-from parameter is
     // empty and indexing it would be undefined behaviour.
     outputMatrix(fInputShape[0], nOutputFeatures), weightMatrix(fInputShape[0], 1), fSampleIndices()
{
   // One matrix per tensor slice.
   inputTensor.reserve(fBatchDepth);
   for (size_t i = 0; i < fBatchDepth; i++) {
      inputTensor.emplace_back(batchHeight, batchWidth);
   }

   // Start from the natural sample order; Shuffle() permutes it later.
   fSampleIndices.reserve(fNSamples);
   for (size_t i = 0; i < fNSamples; i++) {
      fSampleIndices.push_back(i);
   }
}


/** Reorder the sample indices in place with std::shuffle, driven by the
 *  supplied generator. Only fSampleIndices is touched; the dataset and the
 *  staging buffers are left as they are.
 *
 *  \param rng Random number generator handed to std::shuffle.
 */
template <typename AData, typename AReal>
template <typename RNG>
void TTensorDataLoader<AData, TReference<AReal>>::Shuffle(RNG & rng)
{
   const auto first = fSampleIndices.begin();
   const auto last = fSampleIndices.end();
   std::shuffle(first, last, rng);
}


/** Fill the staging buffers with the next batch and return it.
 *
 *  The running batch counter is wrapped modulo the number of complete batches
 *  (fNSamples / fInputShape[0], integer division), the input, output and
 *  weight buffers are refilled starting at the corresponding position of the
 *  sample ordering, and the counter is advanced by one.
 *
 *  \return A TTensorBatch constructed from the loader's input tensor, output
 *          matrix and weight matrix.
 */
template <typename AData, typename AReal>
auto TTensorDataLoader<AData, TReference<AReal>>::GetTensorBatch() -> TTensorBatch<TReference<AReal>>
{
   // Element 0 of the input shape is used as the number of samples per batch.
   const size_t batchSize = fInputShape[0];
   const size_t nBatches = fNSamples / batchSize;

   // Wrap around once every complete batch has been served.
   fBatchIndex = fBatchIndex % nBatches;

   // Position in the sample ordering where the current batch starts.
   IndexIterator_t batchStart = fSampleIndices.begin() + fBatchIndex * batchSize;

   CopyTensorInput(inputTensor, batchStart);
   CopyTensorOutput(outputMatrix, batchStart);
   CopyTensorWeights(weightMatrix, batchStart);

   ++fBatchIndex;
   return TTensorBatch<TReference<AReal>>(inputTensor, outputMatrix, weightMatrix);
}


} // namespace DNN

} // namespace TMVA


#endif

data
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void data
Definition TGWin32VirtualXProxy.cxx:104

TensorDataLoader.h

AReal

TMVA::DNN::TReference
The reference architecture class.
Definition Reference.h:53

TMVA::DNN::TTensorBatchIterator
TTensorBatchIterator.
Definition TensorDataLoader.h:96

TMVA::DNN::TTensorBatch
TTensorBatch.
Definition TensorDataLoader.h:59

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::operator=
TTensorDataLoader & operator=(const TTensorDataLoader &)=default

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::weightMatrix
TMatrixT< AReal > weightMatrix
The matrix used to keep the batch weights.
Definition TensorDataLoader.h:65

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::TTensorDataLoader
TTensorDataLoader(TTensorDataLoader &&)=default

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchHeight
size_t fBatchHeight
The number of rows in each matrix.
Definition TensorDataLoader.h:56

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fData
const AData & fData
The data that should be loaded in the batches.
Definition TensorDataLoader.h:51

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::inputTensor
std::vector< TMatrixT< AReal > > inputTensor
The 3D tensor used to keep the input data.
Definition TensorDataLoader.h:63

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fNSamples
size_t fNSamples
The total number of samples in the dataset.
Definition TensorDataLoader.h:53

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::end
BatchIterator_t end()
Definition TensorDataLoader.h:91

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fInputShape
std::vector< size_t > fInputShape
Defines the batch depth, no. of channels and spatial dimensions of an input tensor.
Definition TensorDataLoader.h:61

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::CopyTensorInput
void CopyTensorInput(std::vector< TMatrixT< AReal > > &tensor, IndexIterator_t sampleIterator)
Copy input tensor into the given host buffer.

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fSampleIndices
std::vector< size_t > fSampleIndices
Ordering of the samples in the epoch.
Definition TensorDataLoader.h:67

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchIndex
size_t fBatchIndex
The index of the batch when there are multiple batches in parallel.
Definition TensorDataLoader.h:59

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::outputMatrix
TMatrixT< AReal > outputMatrix
The matrix used to keep the output.
Definition TensorDataLoader.h:64

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::TTensorDataLoader
TTensorDataLoader(const TTensorDataLoader &)=default

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchDepth
size_t fBatchDepth
The number of matrices in the tensor.
Definition TensorDataLoader.h:55

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fBatchWidth
size_t fBatchWidth
The number of columns in each matrix.
Definition TensorDataLoader.h:57

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::CopyTensorWeights
void CopyTensorWeights(TMatrixT< AReal > &matrix, IndexIterator_t sampleIterator)
Copy weight matrix into the given host buffer.

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::begin
BatchIterator_t begin()
Definition TensorDataLoader.h:90

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::operator=
TTensorDataLoader & operator=(TTensorDataLoader &&)=default

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::fNOutputFeatures
size_t fNOutputFeatures
The number of outputs from the classifier/regressor.
Definition TensorDataLoader.h:58

TMVA::DNN::TTensorDataLoader< AData, TReference< AReal > >::CopyTensorOutput
void CopyTensorOutput(TMatrixT< AReal > &matrix, IndexIterator_t sampleIterator)
Copy output matrix into the given host buffer.

TMVA::DNN::TTensorDataLoader
TTensorDataLoader.
Definition TensorDataLoader.h:133

TMVA::DNN::TTensorDataLoader::BatchIterator_t
TTensorBatchIterator< Data_t, Architecture_t > BatchIterator_t
Definition TensorDataLoader.h:140

TMVA::DNN::TTensorDataLoader::Shuffle
void Shuffle(RNG &rng)
Shuffle the order of the samples in the batch.
Definition TensorDataLoader.h:285

TMVA::DNN::TTensorDataLoader::fSampleIndices
std::vector< size_t > fSampleIndices
Ordering of the samples in the epoch.
Definition TensorDataLoader.h:157

TMVA::DNN::TTensorDataLoader::GetTensorBatch
TTensorBatch< Architecture_t > GetTensorBatch()
Return the next batch from the training set.
Definition TensorDataLoader.h:233

TMVA::DNN::TTensorDataLoader::fBatchDepth
size_t fBatchDepth
The number of matrices in the tensor.
Definition TensorDataLoader.h:146

TMVA::DNN::TTensorDataLoader::fNSamples
size_t fNSamples
The total number of samples in the dataset.
Definition TensorDataLoader.h:143

TMatrixT
TMatrixT.
Definition TMatrixT.h:40

TMVA::DNN::IndexIterator_t
typename std::vector< size_t >::iterator IndexIterator_t
Definition DataLoader.h:42

TMVA
create variable transformations
Definition GeneticMinimizer.h:22