25template <
typename AFloat>
 
   30   const AFloat *dataOutput = 
output.GetRawDataPointer();
 
   36   auto f = [&dataY, &dataOutput, &dataWeights, &temp, 
m](
UInt_t workerID) {
 
   37      AFloat dy = dataY[workerID] - dataOutput[workerID];
 
   38      temp[workerID] = dataWeights[workerID % 
m] * dy * dy;
 
   42   auto reduction = [](
const std::vector<AFloat> & 
v )
 
   44      return std::accumulate(
v.begin(),
v.end(),AFloat{});
 
   52template <
typename AFloat>
 
   59   const AFloat  *dataOutput = 
output.GetRawDataPointer();
 
   65   auto f = [&dataDY, &dataY, &dataOutput, &dataWeights, 
m, norm](
UInt_t workerID) {
 
   66      dataDY[workerID] = -2.0 * norm * (dataY[workerID] - dataOutput[workerID]);
 
   67      dataDY[workerID] *= dataWeights[workerID % 
m];
 
   75template <
typename AFloat>
 
   80   const AFloat *dataOutput = 
output.GetRawDataPointer();
 
   87   auto f = [&dataY, &dataOutput, &dataWeights, &temp, 
m](
UInt_t workerID) {
 
   88      AFloat 
y   = dataY[workerID];
 
   89      AFloat sig = 1.0 / (1.0 + 
exp(- dataOutput[workerID]));
 
   90      temp[workerID] = - (
y * 
log(sig) + (1.0 - 
y) * 
log(1.0 - sig));
 
   91      temp[workerID] *= dataWeights[workerID % 
m];
 
   95   auto reduction = [](
const std::vector<AFloat> & 
v )
 
   97      return std::accumulate(
v.begin(),
v.end(),AFloat{});
 
  105template <
typename AFloat>
 
  111   const AFloat  *dataOutput = 
output.GetRawDataPointer();
 
  117   auto f = [&dataDY, &dataY, &dataOutput, &dataWeights, 
m, norm](
UInt_t workerID) {
 
  118      AFloat 
y   = dataY[workerID];
 
  119      AFloat sig = 1.0 / (1.0 + 
exp(- dataOutput[workerID]));
 
  120      dataDY[workerID] = norm * (sig - 
y);
 
  121      dataDY[workerID] *= dataWeights[workerID % 
m];
 
  129template <
typename AFloat>
 
  134   const AFloat  *dataOutput = 
output.GetRawDataPointer();
 
  137   std::vector<AFloat> temp(Y.
GetNrows());
 
  140   AFloat norm = 1.0 / ((AFloat) 
m);
 
  142   auto f = [&dataY, &dataOutput, &dataWeights, &temp, 
n, 
m](
UInt_t workerID) {
 
  144      for (
size_t j = 0; j < 
n; j++) {
 
  145         sum += 
exp(dataOutput[workerID + j * 
m]);
 
  147      for (
size_t j = 0; j < 
n; j++) {
 
  149            dataY[workerID + j * 
m] * 
log(
exp(dataOutput[workerID + j * 
m]) / 
sum);
 
  151      temp[workerID] *= dataWeights[workerID];
 
  155   auto reduction = [](
const std::vector<AFloat> & 
v )
 
  157      return std::accumulate(
v.begin(),
v.end(),AFloat{});
 
  165template <
typename AFloat>
 
  171   const AFloat  *dataOutput = 
output.GetRawDataPointer();
 
  176   AFloat norm = 1.0 / ((AFloat) 
m);
 
  178   auto f = [&dataDY, &dataY, &dataOutput, &dataWeights, norm, 
n, 
m](
UInt_t workerID) {
 
  181      AFloat weight = dataWeights[workerID];
 
  182      for (
size_t j = 0; j < 
n; j++) {
 
  183         sum  += 
exp(dataOutput[workerID + j * 
m]);
 
  184         sumY += dataY[workerID + j * 
m];
 
  186      for (
size_t j = 0; j < 
n; j++) {
 
  187         dataDY[workerID + j * 
m] =
 
  188            norm * (
exp(dataOutput[workerID + j * 
m]) / 
sum * sumY - dataY[workerID + j * 
m]);
 
  189         dataDY[workerID + j * 
m] *= weight;
 
A pseudo container class which is a generator of indices.
auto Map(F func, unsigned nTimes) -> std::vector< typename std::result_of< F()>::type >
Execute func (with no arguments) nTimes in parallel.
auto Reduce(const std::vector< T > &objs, BINARYOP redfunc) -> decltype(redfunc(objs.front(), objs.front()))
"Reduce" an std::vector into a single object in parallel by passing a binary operator as the second a...
AFloat * GetRawDataPointer()
Return raw pointer to the elements stored contiguously in column-major order.
static ROOT::TThreadExecutor & GetThreadExecutor()
size_t GetNoElements() const
static void CrossEntropyGradients(TCpuMatrix< Scalar_t > &dY, const TCpuMatrix< Scalar_t > &Y, const TCpuMatrix< Scalar_t > &output, const TCpuMatrix< Scalar_t > &weights)
static Scalar_t SoftmaxCrossEntropy(const TCpuMatrix< Scalar_t > &Y, const TCpuMatrix< Scalar_t > &output, const TCpuMatrix< Scalar_t > &weights)
Softmax transformation is implicitly applied, thus output should hold the linear activations of the l...
static Scalar_t MeanSquaredError(const TCpuMatrix< Scalar_t > &Y, const TCpuMatrix< Scalar_t > &output, const TCpuMatrix< Scalar_t > &weights)
static void SoftmaxCrossEntropyGradients(TCpuMatrix< Scalar_t > &dY, const TCpuMatrix< Scalar_t > &Y, const TCpuMatrix< Scalar_t > &output, const TCpuMatrix< Scalar_t > &weights)
static void MeanSquaredErrorGradients(TCpuMatrix< Scalar_t > &dY, const TCpuMatrix< Scalar_t > &Y, const TCpuMatrix< Scalar_t > &output, const TCpuMatrix< Scalar_t > &weights)
static Scalar_t CrossEntropy(const TCpuMatrix< Scalar_t > &Y, const TCpuMatrix< Scalar_t > &output, const TCpuMatrix< Scalar_t > &weights)
Sigmoid transformation is implicitly applied, thus output should hold the linear activations of the l...
Abstract ClassifierFactory template that handles arbitrary types.
static long int sum(long int i)