wichtounet/etl/binary_2relu__derivative_8hpp_source.html

 //=======================================================================
 // Copyright (c) 2014-2023 Baptiste Wicht
 // Distributed under the terms of the MIT License.
 // (See accompanying file LICENSE or copy at
 //  http://opensource.org/licenses/MIT)
 //=======================================================================

 #pragma once

 namespace etl {

 /*!
  * \brief Binary operator for relu derivative.
  *
  * For scalars, the result is rhs where lhs is strictly positive and
  * zero everywhere else (see apply()).
  *
  * \tparam T The type of value
  */
 template <typename T>
 struct relu_derivative_binary_op {
     static constexpr bool linear      = true;  ///< Indicates if the operator is linear or not
     static constexpr bool thread_safe = true;  ///< Indicates if the operator is thread safe or not
     static constexpr bool desc_func   = false; ///< Indicates if the description must be printed as function

     /*!
      * \brief Indicates if the expression is vectorizable using the
      * given vector mode
      * \tparam V The vector mode
      */
     template <vector_mode_t V>
     static constexpr bool vectorizable = true;

     /*!
      * \brief Indicates if the operator can be computed on GPU
      *
      * The GPU paths below go through impl::cudnn::relu_backward, hence
      * the value follows cudnn_enabled.
      */
     template <typename L, typename R>
     static constexpr bool gpu_computable = cudnn_enabled;

     /*!
      * \brief Estimate the complexity of the operator
      * \return An estimation of the complexity of the operator
      */
     static constexpr int complexity() {
         return 1;
     }

     /*!
      * \brief The vectorization type for V
      */
     template <typename V = default_vec>
     using vec_type = typename V::template vec_type<T>;

     /*!
      * \brief Apply the binary operator on lhs and rhs
      * \param lhs The left hand side value on which to apply the operator
      * \param rhs The right hand side value on which to apply the operator
      * \return rhs if lhs is strictly positive, zero otherwise
      */
     static constexpr T apply(const T& lhs, const T& rhs) noexcept {
         // Use constants of type T so that the conditional expression stays
         // in T: with a double literal, rhs would be converted to double and
         // back, which is lossy for wide integer types and an implicit
         // narrowing for float.
         return lhs > T(0) ? rhs : T(0);
     }

     /*!
      * \brief Compute several applications of the operator at a time
      * \param lhs The left hand side vector
      * \param rhs The right hand side vector
      * \tparam V The vectorization mode
      * \return a vector containing several results of the operator
      *
      * The factor applied to rhs is round_up(min(1, lhs)).
      *
      * NOTE(review): assuming V::min is a lane-wise minimum and V::round_up
      * a ceiling, the factor is 1 for lhs > 0 and 0 for lhs in (-1, 0], but
      * a negative integer for lhs <= -1, which would differ from apply().
      * Presumably callers only pass non-negative lhs (e.g. the output of a
      * relu) -- confirm before using this with arbitrary inputs.
      */
     template <typename V = default_vec>
     static ETL_STRONG_INLINE(vec_type<V>) load(const vec_type<V>& lhs, const vec_type<V>& rhs) noexcept {
         auto t1 = V::round_up(V::min(V::set(T(1.0)), lhs));

         return V::mul(t1, rhs);
     }

     /*!
      * \brief Compute the result of the operation using the GPU
      *
      * \param lhs The left hand side expression
      * \param rhs The right hand side expression
      * \param y The expression into which to store the result (only
      * forwarded to smart_gpu_compute_hint here)
      *
      * \return The temporary holding the result of relu_backward
      */
     template <typename L, typename R, typename Y>
     static auto gpu_compute_hint(const L& lhs, const R& rhs, Y& y) noexcept {
         decltype(auto) t1 = smart_gpu_compute_hint(lhs, y);
         decltype(auto) t2 = smart_gpu_compute_hint(rhs, y);

         // Output temporary derived from t2 (dimensions only, no content copy)
         decltype(auto) t3 = force_temporary_gpu_dim_only(t2);

         impl::cudnn::relu_backward(t1, t2, t3);

         return t3;
     }

     /*!
      * \brief Compute the result of the operation using the GPU
      *
      * \param lhs The left hand side expression
      * \param rhs The right hand side expression
      * \param y The expression into which to store the result
      *
      * \return y, after relu_backward has been run with y as its output
      */
     template <typename L, typename R, typename Y>
     static Y& gpu_compute(const L& lhs, const R& rhs, Y& y) noexcept {
         decltype(auto) t1 = smart_gpu_compute_hint(lhs, y);
         decltype(auto) t2 = smart_gpu_compute_hint(rhs, y);

         impl::cudnn::relu_backward(t1, t2, y);

         return y;
     }

     /*!
      * \brief Returns a textual representation of the operator
      * \return a string representing the operator
      */
     static std::string desc() noexcept {
         return "relu_back";
     }
 };

 } //end of namespace etl
etl::relu_derivative_binary_op::complexity
static constexpr int complexity()
Estimate the complexity of the operator.
Definition: relu_derivative.hpp:39

etl::relu_derivative_binary_op::apply
static constexpr T apply(const T &lhs, const T &rhs) noexcept
Apply the binary operator on lhs and rhs.
Definition: relu_derivative.hpp:55

etl::relu_derivative_binary_op::vectorizable
static constexpr bool vectorizable
Indicates if the expression is vectorizable using the given vector mode.
Definition: relu_derivative.hpp:27

etl::relu_derivative_binary_op::linear
static constexpr bool linear
Indicates if the operator is linear or not.
Definition: relu_derivative.hpp:17

etl::relu_derivative_binary_op::desc_func
static constexpr bool desc_func
Indicates if the description must be printed as function.
Definition: relu_derivative.hpp:19

etl::relu_derivative_binary_op
Binary operator for relu derivative.
Definition: relu_derivative.hpp:16

etl::load
auto load(size_t x) const noexcept
Load several elements of the expression at once.
Definition: dyn_matrix_view.hpp:143

etl
Root namespace for the ETL library.
Definition: adapter.hpp:15

etl::relu_derivative_binary_op::gpu_computable
static constexpr bool gpu_computable
Indicates if the operator can be computed on GPU.
Definition: relu_derivative.hpp:33

etl::cudnn_enabled
constexpr bool cudnn_enabled
Indicates if the NVIDIA CUDNN library is available for ETL.
Definition: config.hpp:114

etl::relu_derivative_binary_op::thread_safe
static constexpr bool thread_safe
Indicates if the operator is thread safe or not.
Definition: relu_derivative.hpp:18

etl::relu_derivative_binary_op::desc
static std::string desc() noexcept
Returns a textual representation of the operator.
Definition: relu_derivative.hpp:114

etl::min
auto min(L &&lhs, R &&rhs)
Create an expression with the min value of lhs or rhs.
Definition: expression_builder.hpp:77

etl::force_temporary_gpu_dim_only
decltype(auto) force_temporary_gpu_dim_only(E &&expr)
Force a temporary out of the expression, without copying its content.
Definition: temporary.hpp:223

etl::relu_derivative_binary_op::gpu_compute_hint
static auto gpu_compute_hint(const L &lhs, const R &rhs, Y &y) noexcept
Compute the result of the operation using the GPU.
Definition: relu_derivative.hpp:82

etl::relu_derivative_binary_op::vec_type
typename V::template vec_type< T > vec_type
Definition: relu_derivative.hpp:47

etl::smart_gpu_compute_hint
decltype(auto) smart_gpu_compute_hint(E &expr, Y &y)
Compute the expression into a representation that is GPU up to date.
Definition: helpers.hpp:368

etl::relu_derivative_binary_op::ETL_STRONG_INLINE
static ETL_STRONG_INLINE(vec_type< V >) load(const vec_type< V > &lhs, const vec_type< V > &rhs) noexcept
Compute several applications of the operator at a time.

etl::relu_derivative_binary_op::gpu_compute
static Y & gpu_compute(const L &lhs, const R &rhs, Y &y) noexcept
Compute the result of the operation using the GPU.
Definition: relu_derivative.hpp:101