wichtounet/etl/cce_8hpp_source.html

 //=======================================================================
 // Copyright (c) 2014-2023 Baptiste Wicht
 // Distributed under the terms of the MIT License.
 // (See accompanying file LICENSE or copy at
 //  http://opensource.org/licenses/MIT)
 //=======================================================================

 #pragma once

 //Include the implementations
 #include "etl/impl/std/cce.hpp"
 #include "etl/impl/egblas/cce.hpp"

 namespace etl::detail {

 /*!
  * \brief Choose the implementation used by the combined CCE computation.
  *
  * EGBLAS is chosen only when both impl::egblas::has_scce and
  * impl::egblas::has_dcce are set; otherwise the standard implementation
  * is used. The template parameters are not consulted by this selection.
  *
  * \tparam O The type of the output expression
  * \tparam L The type of the labels expression
  * \return The implementation to use
  */
 template <typename O, typename L>
 constexpr etl::cce_impl select_cce_impl() {
     constexpr bool egblas_available = impl::egblas::has_scce && impl::egblas::has_dcce;

     return egblas_available ? etl::cce_impl::EGBLAS : etl::cce_impl::STD;
 }

 /*!
  * \brief Choose the implementation used by the CCE loss computation.
  *
  * EGBLAS is chosen only when both impl::egblas::has_cce_sloss and
  * impl::egblas::has_cce_dloss are set; otherwise the standard
  * implementation is used. The template parameters are not consulted by
  * this selection.
  *
  * \tparam O The type of the output expression
  * \tparam L The type of the labels expression
  * \return The implementation to use
  */
 template <typename O, typename L>
 constexpr etl::cce_impl select_cce_loss_impl() {
     constexpr bool egblas_available = impl::egblas::has_cce_sloss && impl::egblas::has_cce_dloss;

     return egblas_available ? etl::cce_impl::EGBLAS : etl::cce_impl::STD;
 }

 /*!
  * \brief Choose the implementation used by the CCE error computation.
  *
  * EGBLAS is chosen only when both impl::egblas::has_cce_serror and
  * impl::egblas::has_cce_derror are set; otherwise the standard
  * implementation is used. The template parameters are not consulted by
  * this selection.
  *
  * \tparam O The type of the output expression
  * \tparam L The type of the labels expression
  * \return The implementation to use
  */
 template <typename O, typename L>
 constexpr etl::cce_impl select_cce_error_impl() {
     constexpr bool egblas_available = impl::egblas::has_cce_serror && impl::egblas::has_cce_derror;

     return egblas_available ? etl::cce_impl::EGBLAS : etl::cce_impl::STD;
 }

 /*!
  * \brief Functor dispatching the combined CCE computation to the
  * implementation chosen by select_cce_impl.
  */
 struct cce_impl {
     /*!
      * \brief Compute the CCE of output against labels.
      *
      * \param output The output expression
      * \param labels The labels expression
      * \param alpha First scalar, forwarded unchanged to the backend
      *              (presumably the loss scaling factor - TODO confirm)
      * \param beta Second scalar, forwarded unchanged to the backend
      *             (presumably the error scaling factor - TODO confirm)
      * \return The pair returned by the selected backend
      *         (presumably loss then error - TODO confirm)
      */
     template <typename O, typename L>
     static std::pair<value_t<O>, value_t<O>> apply(const O& output, const L& labels, value_t<O> alpha, value_t<O> beta) {
         constexpr auto selected = select_cce_impl<O, L>();

         if constexpr (selected == etl::cce_impl::EGBLAS) {
             // Get GPU-forwarded handles on both operands
             decltype(auto) gpu_output = smart_forward_gpu(output);
             decltype(auto) gpu_labels = smart_forward_gpu(labels);

             // The kernel reads GPU memory, so both sides must be current there
             gpu_output.ensure_gpu_up_to_date();
             gpu_labels.ensure_gpu_up_to_date();

             const auto dim0 = etl::dim<0>(output);
             const auto dim1 = etl::dim<1>(output);

             return impl::egblas::cce(dim0, dim1, alpha, beta, gpu_output.gpu_memory(), gpu_labels.gpu_memory());
         } else if constexpr (selected == etl::cce_impl::STD) {
             // Both expressions are forced before the standard routine runs
             etl::force(output);
             etl::force(labels);

             return impl::standard::cce(output, labels, alpha, beta);
         } else {
             cpp_unreachable("Invalid selection for CCE");
         }
     }
 };

 /*!
  * \brief Functor dispatching the CCE loss computation to the
  * implementation chosen by select_cce_loss_impl.
  */
 struct cce_loss_impl {
     /*!
      * \brief Compute the CCE loss of output against labels.
      *
      * \param output The output expression
      * \param labels The labels expression
      * \param scale Scalar forwarded unchanged to the backend
      * \return The value returned by the selected backend
      */
     template <typename O, typename L>
     static value_t<O> apply(const O& output, const L& labels, value_t<O> scale) {
         constexpr auto selected = select_cce_loss_impl<O, L>();

         if constexpr (selected == etl::cce_impl::EGBLAS) {
             // Get GPU-forwarded handles on both operands
             decltype(auto) gpu_output = smart_forward_gpu(output);
             decltype(auto) gpu_labels = smart_forward_gpu(labels);

             // The kernel reads GPU memory, so both sides must be current there
             gpu_output.ensure_gpu_up_to_date();
             gpu_labels.ensure_gpu_up_to_date();

             const auto n = etl::size(output);

             // The two literal 1 arguments are presumably element strides - TODO confirm
             return impl::egblas::cce_loss(n, scale, gpu_output.gpu_memory(), 1, gpu_labels.gpu_memory(), 1);
         } else if constexpr (selected == etl::cce_impl::STD) {
             // Both expressions are forced before the standard routine runs
             etl::force(output);
             etl::force(labels);

             return impl::standard::cce_loss(output, labels, scale);
         } else {
             cpp_unreachable("Invalid selection for CCE");
         }
     }
 };

 /*!
  * \brief Functor dispatching the CCE error computation to the
  * implementation chosen by select_cce_error_impl.
  */
 struct cce_error_impl {
     /*!
      * \brief Compute the CCE error of output against labels.
      *
      * \param output The output expression
      * \param labels The labels expression
      * \param scale Scalar forwarded unchanged to the backend
      * \return The value returned by the selected backend
      */
     template <typename O, typename L>
     static value_t<O> apply(const O& output, const L& labels, value_t<O> scale) {
         constexpr auto selected = select_cce_error_impl<O, L>();

         if constexpr (selected == etl::cce_impl::EGBLAS) {
             // Get GPU-forwarded handles on both operands
             decltype(auto) gpu_output = smart_forward_gpu(output);
             decltype(auto) gpu_labels = smart_forward_gpu(labels);

             // The kernel reads GPU memory, so both sides must be current there
             gpu_output.ensure_gpu_up_to_date();
             gpu_labels.ensure_gpu_up_to_date();

             const auto dim0 = etl::dim<0>(output);
             const auto dim1 = etl::dim<1>(output);

             return impl::egblas::cce_error(dim0, dim1, scale, gpu_output.gpu_memory(), gpu_labels.gpu_memory());
         } else if constexpr (selected == etl::cce_impl::STD) {
             // Both expressions are forced before the standard routine runs
             etl::force(output);
             etl::force(labels);

             return impl::standard::cce_error(output, labels, scale);
         } else {
             cpp_unreachable("Invalid selection for CCE");
         }
     }
 };

 } //end of namespace etl::detail
etl::detail::cce_impl::apply
static std::pair< value_t< O >, value_t< O > > apply(const O &output, const L &labels, value_t< O > alpha, value_t< O > beta)
Compute the CCE of output against labels using the selected implementation.
Definition: cce.hpp:77

cce.hpp
EGBLAS wrappers for the cce operations.

etl::detail::select_cce_error_impl
constexpr etl::cce_impl select_cce_error_impl()
Select the CCE error implementation for an output of type O and labels of type L.
Definition: cce.hpp:61

etl::batch_softmax_impl::STD
Standard implementation.

etl::force
void force(Expr &&expr)
Force the internal evaluation of an expression.
Definition: evaluator.hpp:1292

etl::detail
Definition: expression_builder.hpp:699

etl::detail::cce_error_impl
CCE error operation implementation.
Definition: cce.hpp:132

etl::bce_impl::EGBLAS
GPU implementation.

etl::detail::select_cce_impl
constexpr etl::cce_impl select_cce_impl()
Select the CCE implementation for an output of type O and labels of type L.
Definition: cce.hpp:31

etl::cce_impl
cce_impl
Enumeration describing the different implementations of CCE.
Definition: cce_impl.hpp:20

etl::scale
auto scale(LE &&lhs, RE &&rhs)
Builds an expression representing the scalar multiplication of lhs and rhs.
Definition: binary_expression_builder.hpp:64

etl::detail::cce_loss_impl
CCE loss operation implementation.
Definition: cce.hpp:102

cce.hpp
Standard implementation of the Categorical Cross Entropy reduction.

etl::detail::select_cce_loss_impl
constexpr etl::cce_impl select_cce_loss_impl()
Select the CCE loss implementation for an output of type O and labels of type L.
Definition: cce.hpp:46

etl::smart_forward_gpu
decltype(auto) smart_forward_gpu(E &expr)
Smart forwarding for a temporary expression that will be computed in GPU.
Definition: helpers.hpp:343

etl::size
constexpr size_t size(const E &expr) noexcept
Returns the size of the given ETL expression.
Definition: helpers.hpp:108

etl::detail::cce_error_impl::apply
static value_t< O > apply(const O &output, const L &labels, value_t< O > scale)
Compute the CCE error of output against labels using the selected implementation.
Definition: cce.hpp:137

etl::value_t
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81

etl::detail::cce_impl
CCE operation implementation.
Definition: cce.hpp:72

etl::detail::cce_loss_impl::apply
static value_t< O > apply(const O &output, const L &labels, value_t< O > scale)
Compute the CCE loss of output against labels using the selected implementation.
Definition: cce.hpp:107