wichtounet/etl/pool__upsample__2d__expr_8hpp_source.html

 //=======================================================================
 // Copyright (c) 2014-2023 Baptiste Wicht
 // Distributed under the terms of the MIT License.
 // (See accompanying file LICENSE or copy at
 //  http://opensource.org/licenses/MIT)
 //=======================================================================

 #pragma once

 #include "etl/expr/base_temporary_expr.hpp"

 //Get the implementations
 #include "etl/impl/std/max_pooling_upsample.hpp"
 #include "etl/impl/std/avg_pooling_upsample.hpp"
 #include "etl/impl/cudnn/pooling_upsample.hpp"

 namespace etl {

 /*!
  * \brief Temporary expression combining the derivative of a 2D pooling
  * (max or average) with the upsampling.
  *
  * \tparam A The type of the first sub expression (named input by the builder functions)
  * \tparam B The type of the second sub expression (named output by the builder functions)
  * \tparam C The type of the third sub expression (named errors by the builder functions)
  * \tparam C1 First pooling parameter, used in the check of the second to last dimension
  * \tparam C2 Second pooling parameter, used in the check of the last dimension
  * \tparam S1 Multiplier of the second to last dimension of B in the dimension check (presumably the stride)
  * \tparam S2 Multiplier of the last dimension of B in the dimension check (presumably the stride)
  * \tparam P1 Subtracted twice in the check of the second to last dimension (presumably the padding)
  * \tparam P2 Subtracted twice in the check of the last dimension (presumably the padding)
  * \tparam Max true to dispatch to the max_pool_upsample_2d implementations, false for avg_pool_upsample_2d
  */
 template <etl_expr A, same_dimensions<A> B, same_dimensions<A> C, size_t C1, size_t C2, size_t S1, size_t S2, size_t P1, size_t P2, bool Max>
 struct pool_upsample_2d_expr : base_temporary_expr_tern<pool_upsample_2d_expr<A, B, C, C1, C2, S1, S2, P1, P2, Max>, A, B, C> {
     using value_type = value_t<A>;                                                  ///< The type of value of the expression
     using sub_traits = etl::decay_traits<A>;                                        ///< The traits of the first sub expression
     using this_type  = pool_upsample_2d_expr<A, B, C, C1, C2, S1, S2, P1, P2, Max>; ///< The type of this expression
     using base_type  = base_temporary_expr_tern<this_type, A, B, C>;                ///< The base type

     static constexpr auto storage_order = sub_traits::storage_order; ///< The storage order, taken from A

     /*!
      * \brief Indicates if the temporary expression can be directly evaluated
      * using only GPU.
      *
      * NOTE(review): only A and B are inspected here, whereas
      * select_default_impl also inspects C and the result type. Confirm
      * whether C should be part of this condition.
      */
     static constexpr bool gpu_computable = cudnn_enabled && all_floating<A, B> && all_homogeneous<A, B>;

     friend struct etl_traits<pool_upsample_2d_expr>;

     /*!
      * \brief Construct a new expression
      * \param a The first sub expression
      * \param b The second sub expression
      * \param c The third sub expression
      */
     pool_upsample_2d_expr(A a, B b, C c) : base_type(a, b, c) {
         //Nothing else to init
     }

     /*!
      * \brief Validate the dimensions of the operands and of the result.
      *
      * When all the types are fast, the validation is done with
      * static_assert, otherwise it is done with cpp_assert.
      *
      * The checks are:
      *  - result and a have the same size
      *  - b and c have the same size
      *  - the last two dimensions of a match
      *    S * (dim(b) - 1) + C - 2 * P
      *
      * \param a The first sub expression
      * \param b The second sub expression
      * \param c The third sub expression
      * \param result The expression receiving the result
      */
     template <same_dimensions<A> R>
     static void check([[maybe_unused]] const A& a, [[maybe_unused]] const B& b, [[maybe_unused]] const C& c, [[maybe_unused]] const R& result) {
         static constexpr size_t D = etl::decay_traits<A>::dimensions();

         if constexpr (all_fast<A, B, C, R>) {
             static_assert(etl::decay_traits<R>::size() == etl::decay_traits<A>::size(), "max_pool_upsample_2d:A and R must have the same size");
             static_assert(etl::decay_traits<B>::size() == etl::decay_traits<C>::size(), "max_pool_upsample_2d:B and C must have the same size");

             static_assert(etl::decay_traits<A>::template dim<D - 2>() == S1 * (etl::decay_traits<B>::template dim<D - 2>() - 1) + C1 - 2 * P1,
                           "Invalid pooling dimensions for max_pool_upsample_2d");
             static_assert(etl::decay_traits<A>::template dim<D - 1>() == S2 * (etl::decay_traits<B>::template dim<D - 1>() - 1) + C2 - 2 * P2,
                           "Invalid pooling dimensions for max_pool_upsample_2d");
         } else {
             cpp_assert(etl::size(result) == etl::size(a), "max_pool_upsample_2d:A and R must have the same size");
             cpp_assert(etl::size(b) == etl::size(c), "max_pool_upsample_2d:B and C must have the same size");

             cpp_assert(etl::dim<D - 2>(a) == S1 * (etl::dim<D - 2>(b) - 1) + C1 - 2 * P1, "Invalid pooling dimensions for max_pool_upsample_2d");
             cpp_assert(etl::dim<D - 1>(a) == S2 * (etl::dim<D - 1>(b) - 1) + C2 - 2 * P2, "Invalid pooling dimensions for max_pool_upsample_2d");
         }
     }

     /*!
      * \brief Select the default pool implementation for an expression of type ABC->R.
      *
      * CUDNN is selected when it is enabled, all the types are floating
      * point and the GPU is not disabled. STD is selected otherwise.
      *
      * \param no_gpu Indicates that the GPU must not be used
      * \return The implementation to use
      */
     template <typename R>
     static constexpr etl::pool_impl select_default_impl(bool no_gpu) {
         if (cudnn_enabled && all_floating<A, B, C, R> && !no_gpu) {
             return etl::pool_impl::CUDNN;
         }

         return etl::pool_impl::STD;
     }

 #ifdef ETL_MANUAL_SELECT

     /*!
      * \brief Select the pool implementation for an expression of type ABC->R.
      *
      * If an implementation is forced in the local context, it is used,
      * except for CUDNN when it cannot be applied to this expression. In
      * that case, a message is printed on std::cerr and the default
      * selection is used.
      *
      * \return The implementation to use
      */
     template <typename R>
     static etl::pool_impl select_impl() {
         if (local_context().pool_selector.forced) {
             auto forced = local_context().pool_selector.impl;

             switch (forced) {
                 // CUDNN cannot always be used
                 case pool_impl::CUDNN:
                     if (!cudnn_enabled || !all_floating<A, B, C, R> || local_context().cpu) {                                            //COVERAGE_EXCLUDE_LINE
                         std::cerr << "Forced selection to CUDNN pool implementation, but not possible for this expression" << std::endl; //COVERAGE_EXCLUDE_LINE
                         return select_default_impl<R>(local_context().cpu);                                                              //COVERAGE_EXCLUDE_LINE
                     }                                                                                                                    //COVERAGE_EXCLUDE_LINE

                     return forced;

                 //In other cases, simply use the forced impl
                 default:
                     return forced;
             }
         }

         return select_default_impl<R>(local_context().cpu);
     }

 #else

     /*!
      * \brief Select the pool implementation for an expression of type ABC->R.
      *
      * Without manual selection, this is the default selection with the
      * GPU allowed.
      *
      * \return The implementation to use
      */
     template <typename R>
     static constexpr etl::pool_impl select_impl() {
         return select_default_impl<R>(false);
     }

 #endif

     // Assignment functions

     /*!
      * \brief Evaluate the expression into the given result.
      *
      * The operands are validated, then the computation is dispatched to
      * the max or avg implementation (according to Max) of the selected
      * backend.
      *
      * \param result The expression to which assign
      */
     template <etl_expr R>
     void assign_to(R&& result) const {
         inc_counter("temp:assign");

         auto& a = this->a();
         auto& b = this->b();
         auto& c = this->c();

         check(a, b, c, result);

         constexpr_select auto impl = select_impl<R>();

         if constexpr (Max) {
             if constexpr_select (impl == pool_impl::STD) {
                 inc_counter("impl:std");
                 impl::standard::max_pool_upsample_2d::apply<C1, C2, S1, S2, P1, P2>(smart_forward(a), smart_forward(b), smart_forward(c), result);
             } else if constexpr_select (impl == pool_impl::CUDNN) {
                 inc_counter("impl:cudnn");
                 impl::cudnn::max_pool_upsample_2d::apply(smart_forward_gpu(a), smart_forward_gpu(b), smart_forward_gpu(c), result, C1, C2, S1, S2, P1, P2);
             } else {
                 cpp_unreachable("Invalid pool implementation");
             }
         } else {
             if constexpr_select (impl == pool_impl::STD) {
                 inc_counter("impl:std");
                 impl::standard::avg_pool_upsample_2d::apply<C1, C2, S1, S2, P1, P2>(smart_forward(a), smart_forward(b), smart_forward(c), result);
             } else if constexpr_select (impl == pool_impl::CUDNN) {
                 inc_counter("impl:cudnn");
                 impl::cudnn::avg_pool_upsample_2d::apply(smart_forward_gpu(a), smart_forward_gpu(b), smart_forward_gpu(c), result, C1, C2, S1, S2, P1, P2);
             } else {
                 cpp_unreachable("Invalid pool implementation");
             }
         }
     }

     /*!
      * \brief Add to the given left-hand-side expression
      * \param lhs The expression to which assign
      */
     template <typename L>
     void assign_add_to(L&& lhs) const {
         std_add_evaluate(*this, lhs);
     }

     /*!
      * \brief Sub from the given left-hand-side expression
      * \param lhs The expression to which assign
      */
     template <typename L>
     void assign_sub_to(L&& lhs) const {
         std_sub_evaluate(*this, lhs);
     }

     /*!
      * \brief Multiply the given left-hand-side expression
      * \param lhs The expression to which assign
      */
     template <typename L>
     void assign_mul_to(L&& lhs) const {
         std_mul_evaluate(*this, lhs);
     }

     /*!
      * \brief Divide the given left-hand-side expression
      * \param lhs The expression to which assign
      */
     template <typename L>
     void assign_div_to(L&& lhs) const {
         std_div_evaluate(*this, lhs);
     }

     /*!
      * \brief Modulo the given left-hand-side expression
      * \param lhs The expression to which assign
      */
     template <typename L>
     void assign_mod_to(L&& lhs) const {
         std_mod_evaluate(*this, lhs);
     }

     /*!
      * \brief Print a representation of the expression on the given stream
      * \param os The output stream
      * \param expr The expression to print
      * \return the output stream
      */
     friend std::ostream& operator<<(std::ostream& os, const pool_upsample_2d_expr& expr) {
         // This template serves both poolings: the printed name must follow Max
         return os << (Max ? "max_pool_upsample2(" : "avg_pool_upsample2(") << expr._a << ", " << expr._b << ", " << expr._c << ")";
     }
 };

 template <typename A, typename B, typename C, size_t C1, size_t C2, size_t S1, size_t S2, size_t P1, size_t P2, bool Max>
 struct etl_traits<etl::pool_upsample_2d_expr<A, B, C, C1, C2, S1, S2, P1, P2, Max>> {
     using expr_t     = etl::pool_upsample_2d_expr<A, B, C, C1, C2, S1, S2, P1, P2, Max>;
     using sub_expr_t = std::decay_t<A>;
     using sub_traits = etl_traits<sub_expr_t>;
     using value_type = value_t<A>;

     static constexpr bool is_etl         = true;
     static constexpr bool is_transformer = false;
     static constexpr bool is_view        = false;
     static constexpr bool is_magic_view  = false;
     static constexpr bool is_fast        = sub_traits::is_fast;
     static constexpr bool is_linear      = false;
     static constexpr bool is_thread_safe = true;
     static constexpr bool is_value       = false;
     static constexpr bool is_direct      = true;
     static constexpr bool is_generator   = false;
     static constexpr bool is_padded      = false;
     static constexpr bool is_aligned     = true;
     static constexpr bool is_temporary   = true;
     static constexpr bool gpu_computable = is_gpu_t<value_type> && cuda_enabled;
     static constexpr order storage_order = sub_traits::storage_order;

     template <vector_mode_t V>
     static constexpr bool vectorizable = true;

     template <size_t DD>
     static constexpr size_t dim() {
         return decay_traits<A>::template dim<DD>();
     }

     static size_t dim(const expr_t& e, size_t d) {
         return etl::dim(e.a(), d);
     }

     static size_t size(const expr_t& e) {
         return etl::size(e.a());
     }

     static constexpr size_t size() {
         return decay_traits<A>::size();
     }

     static constexpr size_t dimensions() {
         return sub_traits::dimensions();
     }

     static constexpr int complexity() noexcept {
         return -1;
     }
 };

 /*!
  * \brief Build the max variant (Max = true) of pool_upsample_2d_expr
  * from the three given expressions.
  *
  * \tparam C1 First pooling parameter
  * \tparam C2 Second pooling parameter
  * \tparam S1 Defaults to C1 (presumably the first stride)
  * \tparam S2 Defaults to C2 (presumably the second stride)
  * \tparam P1 Defaults to 0 (presumably the first padding)
  * \tparam P2 Defaults to 0 (presumably the second padding)
  *
  * \param input The first sub expression
  * \param output The second sub expression
  * \param errors The third sub expression
  *
  * \return The expression holding the three sub expressions
  */
 template <size_t C1, size_t C2, size_t S1 = C1, size_t S2 = C2, size_t P1 = 0, size_t P2 = 0, etl_expr A, etl_expr B, etl_expr C>
 pool_upsample_2d_expr<detail::build_type<A>, detail::build_type<B>, detail::build_type<C>, C1, C2, S1, S2, P1, P2, true> max_pool_upsample_2d(A&& input, B&& output, C&& errors) {
     using max_expr_t = pool_upsample_2d_expr<detail::build_type<A>, detail::build_type<B>, detail::build_type<C>, C1, C2, S1, S2, P1, P2, true>;

     return max_expr_t{input, output, errors};
 }

 /*!
  * \brief Build the average variant (Max = false) of pool_upsample_2d_expr
  * from the three given expressions.
  *
  * \tparam C1 First pooling parameter
  * \tparam C2 Second pooling parameter
  * \tparam S1 Defaults to C1 (presumably the first stride)
  * \tparam S2 Defaults to C2 (presumably the second stride)
  * \tparam P1 Defaults to 0 (presumably the first padding)
  * \tparam P2 Defaults to 0 (presumably the second padding)
  *
  * \param input The first sub expression
  * \param output The second sub expression
  * \param errors The third sub expression
  *
  * \return The expression holding the three sub expressions
  */
 template <size_t C1, size_t C2, size_t S1 = C1, size_t S2 = C2, size_t P1 = 0, size_t P2 = 0, etl_expr A, etl_expr B, etl_expr C>
 pool_upsample_2d_expr<detail::build_type<A>, detail::build_type<B>, detail::build_type<C>, C1, C2, S1, S2, P1, P2, false> avg_pool_upsample_2d(A&& input, B&& output, C&& errors) {
     using avg_expr_t = pool_upsample_2d_expr<detail::build_type<A>, detail::build_type<B>, detail::build_type<C>, C1, C2, S1, S2, P1, P2, false>;

     return avg_expr_t{input, output, errors};
 }

 } //end of namespace etl
etl::base_temporary_expr_tern< pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max >, A, B, C >::b
std::add_lvalue_reference_t< B > b()
Returns the sub expression.
Definition: base_temporary_expr.hpp:702

etl::pool_upsample_2d_expr::operator<<
friend std::ostream & operator<<(std::ostream &os, const pool_upsample_2d_expr &expr)
Print a representation of the expression on the given stream.
Definition: pool_upsample_2d_expr.hpp:236

etl::pool_upsample_2d_expr::pool_upsample_2d_expr
pool_upsample_2d_expr(A a, B b, C c)
Construct a new expression.
Definition: pool_upsample_2d_expr.hpp:46

etl::impl::cudnn::avg_pool_upsample_2d::apply
static void apply([[maybe_unused]] A &&in, [[maybe_unused]] B &&out, [[maybe_unused]] C &&errors, [[maybe_unused]] M &m, [[maybe_unused]] size_t c1, [[maybe_unused]] size_t c2, [[maybe_unused]] size_t s1, [[maybe_unused]] size_t s2, [[maybe_unused]] size_t p1, [[maybe_unused]] size_t p2)
Apply the functor on sub and store the result in m.
Definition: pooling_upsample.hpp:263

etl::pool_impl
pool_impl
Enumeration describing the different implementations of pooling.
Definition: pool_impl.hpp:21

etl::batch_softmax_impl::STD
Standard implementation.

etl::is_magic_view
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311

etl::pool_upsample_2d_expr::select_default_impl
static constexpr etl::pool_impl select_default_impl(bool no_gpu)
Select the pool implementation for an expression of type ABC->R.
Definition: pool_upsample_2d_expr.hpp:84

etl::D
D D
The number of dimensions.
Definition: dyn_matrix_view.hpp:24

etl::etl_traits< etl::pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max > >::sub_expr_t
std::decay_t< A > sub_expr_t
The sub expression type.
Definition: pool_upsample_2d_expr.hpp:248

etl::order
order
Storage order of a matrix.
Definition: order.hpp:15

etl::cuda_enabled
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94

etl::base_temporary_expr_tern::_a
A _a
The first sub expression reference.
Definition: base_temporary_expr.hpp:638

etl::pool_upsample_2d_expr::assign_to
void assign_to(R &&result) const
Assign to a matrix of the same storage order.
Definition: pool_upsample_2d_expr.hpp:143

etl::pool_upsample_2d_expr::check
static void check([[maybe_unused]] const A &a, [[maybe_unused]] const B &b, [[maybe_unused]] const C &c, [[maybe_unused]] const R &result)
Validate the pooling upsample dimensions.
Definition: pool_upsample_2d_expr.hpp:56

etl::impl::cudnn::max_pool_upsample_2d::apply
static void apply([[maybe_unused]] A &&in, [[maybe_unused]] B &&out, [[maybe_unused]] C &&errors, [[maybe_unused]] M &m, [[maybe_unused]] size_t c1, [[maybe_unused]] size_t c2, [[maybe_unused]] size_t s1, [[maybe_unused]] size_t s2, [[maybe_unused]] size_t p1, [[maybe_unused]] size_t p2)
Apply the functor on sub and store the result in m.
Definition: pooling_upsample.hpp:213

etl::pool_upsample_2d_expr::storage_order
static constexpr auto storage_order
The sub storage order.
Definition: pool_upsample_2d_expr.hpp:32

etl::etl_traits< etl::pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max > >::complexity
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: pool_upsample_2d_expr.hpp:324

etl::etl_traits< etl::pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max > >::value_type
value_t< A > value_type
The value type of the expression.
Definition: pool_upsample_2d_expr.hpp:250

etl::base_temporary_expr_tern< pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max >, A, B, C >::a
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:686

etl::is_fast
constexpr bool is_fast
Traits to test if the given ETL expression type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588

etl::pool_upsample_2d_expr::gpu_computable
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: pool_upsample_2d_expr.hpp:38

etl::etl_traits
Traits to get information about ETL types.
Definition: tmp.hpp:68

etl
Root namespace for the ETL library.
Definition: adapter.hpp:15

etl::etl_traits< etl::pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max > >::dim
static constexpr size_t dim()
Returns the DDth dimension of the expression.
Definition: pool_upsample_2d_expr.hpp:281

etl::local_context
context & local_context()
Return the configuration context of the current thread.
Definition: context.hpp:50

etl::etl_traits< etl::pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max > >::size
static constexpr size_t size()
Returns the size of the expression.
Definition: pool_upsample_2d_expr.hpp:308

etl::etl_traits::dimensions
static constexpr size_t dimensions()
Return the number of dimensions of the expression.
Definition: traits_base.hpp:31

etl::pool_upsample_2d_expr::assign_sub_to
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: pool_upsample_2d_expr.hpp:199

etl::dim
auto dim(E &&value, size_t i) -> detail::identity_helper< E, dim_view< detail::build_identity_type< E >, D >>
Return a view representing the ith Dth dimension.
Definition: view_expression_builder.hpp:25

etl::pool_upsample_2d_expr::assign_div_to
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: pool_upsample_2d_expr.hpp:217

etl::detail::build_type
std::conditional_t< is_etl_value< T >, const std::decay_t< T > &, std::decay_t< T > > build_type
Helper to build the type for a sub expression.
Definition: expression_helpers.hpp:24

etl::cudnn_enabled
constexpr bool cudnn_enabled
Indicates if the NVIDIA CUDNN library is available for ETL.
Definition: config.hpp:114

etl::context::cpu
bool cpu
Force CPU evaluation.
Definition: context.hpp:29

etl::batch_softmax_impl::CUDNN
GPU implementation.

etl::std_mod_evaluate
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271

etl::base_temporary_expr_tern
Abstract base class for temporary ternary expression.
Definition: base_temporary_expr.hpp:634

etl::std_mul_evaluate
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233

etl::is_transformer
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297

etl::smart_forward_gpu
decltype(auto) smart_forward_gpu(E &expr)
Smart forwarding for a temporary expression that will be computed in GPU.
Definition: helpers.hpp:343

etl::pool_upsample_2d_expr::assign_mod_to
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: pool_upsample_2d_expr.hpp:226

etl::size
constexpr size_t size(const E &expr) noexcept
Returns the size of the given ETL expression.
Definition: helpers.hpp:108

etl::etl_traits< etl::pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max > >::dimensions
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: pool_upsample_2d_expr.hpp:316

etl::is_view
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304

etl::pool_upsample_2d_expr::assign_mul_to
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: pool_upsample_2d_expr.hpp:208

etl::etl_traits::is_fast
static constexpr bool is_fast
Indicates if T is a fast structure.
Definition: traits_base.hpp:25

etl::etl_traits< etl::pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max > >::size
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: pool_upsample_2d_expr.hpp:300

etl::etl_traits< etl::pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max > >::dim
static size_t dim(const expr_t &e, size_t d)
Returns the dth dimension of the expression.
Definition: pool_upsample_2d_expr.hpp:291

etl::std_sub_evaluate
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214

etl::smart_forward
decltype(auto) smart_forward(E &expr)
Smart forwarding for a temporary expression.
Definition: helpers.hpp:323

etl::pool_upsample_2d_expr
A derivative of the 2D max pooling (combine derivative and upsampling for performance) ...
Definition: pool_upsample_2d_expr.hpp:26

etl::is_thread_safe
constexpr bool is_thread_safe
Traits to test if the given ETL expression type is thread safe.
Definition: traits.hpp:687

etl::base_temporary_expr_tern::_b
B _b
The second sub expression reference.
Definition: base_temporary_expr.hpp:639

etl::base_temporary_expr_tern::_c
C _c
The third sub expression reference.
Definition: base_temporary_expr.hpp:640

etl::pool_upsample_2d_expr::assign_add_to
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: pool_upsample_2d_expr.hpp:190

etl::value_t
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81

etl::std_div_evaluate
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252

etl::inc_counter
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25

etl::pool_upsample_2d_expr::value_type
value_t< A > value_type
The type of value of the expression.
Definition: pool_upsample_2d_expr.hpp:27

etl::base_temporary_expr_tern< pool_upsample_2d_expr< A, B, C, C1, C2, S1, S2, P1, P2, Max >, A, B, C >::c
std::add_lvalue_reference_t< C > c()
Returns the sub expression.
Definition: base_temporary_expr.hpp:718

etl::max_pool_upsample_2d
dyn_pool_upsample_2d_expr< detail::build_type< A >, detail::build_type< B >, detail::build_type< C >, true > max_pool_upsample_2d(A &&input, B &&output, C &&errors, size_t c1, size_t c2)
Derivative of the 2D Max Pooling of the given matrix expression and upsampling.
Definition: dyn_pool_upsample_2d_expr.hpp:325

etl::std_add_evaluate
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195

etl::avg_pool_upsample_2d
dyn_pool_upsample_2d_expr< detail::build_type< A >, detail::build_type< B >, detail::build_type< C >, false > avg_pool_upsample_2d(A &&input, B &&output, C &&errors, size_t c1, size_t c2)
Derivative of the 2D Average Pooling of the given matrix expression and upsampling.
Definition: dyn_pool_upsample_2d_expr.hpp:353

etl::pool_upsample_2d_expr::select_impl
static constexpr etl::pool_impl select_impl()
Select the pool implementation for an expression of type ABC->R.
Definition: pool_upsample_2d_expr.hpp:130