wichtounet/etl/pooling_8hpp_source.html

 //=======================================================================
 // Copyright (c) 2014-2023 Baptiste Wicht
 // Distributed under the terms of the MIT License.
 // (See accompanying file LICENSE or copy at
 //  http://opensource.org/licenses/MIT)
 //=======================================================================

 #pragma once

 // Include all the modules

 #include "etl/impl/max_pooling_derivative.hpp"
 #include "etl/impl/avg_pooling_derivative.hpp"

 // Include the implementations

 #include "etl/impl/std/max_pooling.hpp"
 #include "etl/impl/std/avg_pooling.hpp"
 #include "etl/impl/cudnn/max_pooling.hpp"

 namespace etl::impl {

 /*!
  * \brief Select the default pooling implementation for the given expression types.
  *
  * CUDNN is returned only when cudnn_enabled is set, all_floating<X, Y> holds and
  * the GPU has not been excluded through no_gpu. Otherwise, STD is returned.
  *
  * \tparam X The type of the expression to pool (x in the apply functions)
  * \tparam Y The type of the expression receiving the result (y in the apply functions)
  * \param no_gpu If true, the CUDNN implementation is never selected
  * \return The pooling implementation to use
  */
 template <etl_dma X, etl_dma Y>
 constexpr etl::pool_impl select_default_pool_impl(bool no_gpu) {
     const bool use_cudnn = cudnn_enabled && all_floating<X, Y> && !no_gpu;

     return use_cudnn ? etl::pool_impl::CUDNN : etl::pool_impl::STD;
 }

 #ifdef ETL_MANUAL_SELECT

 /*!
  * \brief Select the pooling implementation, honouring a selection forced
  * through the local context.
  *
  * When no implementation is forced, the default selection is used, with the
  * GPU excluded if the local context requests CPU evaluation. A forced CUDNN
  * selection that cannot be honoured is reported on std::cerr and replaced by
  * the default selection. Any other forced implementation is returned as is.
  *
  * \tparam X The type of the expression to pool
  * \tparam Y The type of the expression receiving the result
  * \return The pooling implementation to use
  */
 template <typename X, typename Y>
 etl::pool_impl select_pool_impl() {
     // Nothing forced: rely on the default selection
     if (!local_context().pool_selector.forced) {
         return select_default_pool_impl<X, Y>(local_context().cpu);
     }

     const auto requested = local_context().pool_selector.impl;

     // CUDNN cannot always be used
     if (requested == pool_impl::CUDNN) {
         const bool cudnn_usable = cudnn_enabled && all_floating<X, Y> && !local_context().cpu; //COVERAGE_EXCLUDE_LINE

         if (!cudnn_usable) {                                                                                                 //COVERAGE_EXCLUDE_LINE
             std::cerr << "Forced selection to CUDNN pool implementation, but not possible for this expression" << std::endl; //COVERAGE_EXCLUDE_LINE
             return select_default_pool_impl<X, Y>(local_context().cpu);                                                      //COVERAGE_EXCLUDE_LINE
         }                                                                                                                    //COVERAGE_EXCLUDE_LINE
     }

     // In every remaining case, simply use the forced impl
     return requested;
 }

 #else

 /*!
  * \brief Select the pooling implementation at compile time.
  *
  * This variant is used when ETL_MANUAL_SELECT is not defined: it always
  * forwards to the default selection without excluding the GPU.
  *
  * \tparam X The type of the expression to pool
  * \tparam Y The type of the expression receiving the result
  * \return The pooling implementation to use
  */
 template <typename X, typename Y>
 constexpr etl::pool_impl select_pool_impl() {
     constexpr bool no_gpu = false;

     return select_default_pool_impl<X, Y>(no_gpu);
 }

 #endif

 /*!
  * \brief Functor for 2D Max Pooling
  */
 struct max_pool_2d {
     /*!
      * \brief Indicates if the temporary expression can be directly evaluated
      * using only GPU. The value is cudnn_enabled, whatever A is.
      */
     template <typename A>
     static constexpr bool gpu_computable = cudnn_enabled;

     /*!
      * \brief Pool x into y, with the pooling parameters given at compile time
      * \tparam C1 The first dimension pooling ratio
      * \tparam C2 The second dimension pooling ratio
      * \tparam S1 The first dimension stride
      * \tparam S2 The second dimension stride
      * \tparam P1 The first dimension padding
      * \tparam P2 The second dimension padding
      * \param x The expression to pool
      * \param y The expression in which the result is stored
      */
     template <size_t C1, size_t C2, size_t S1, size_t S2, size_t P1, size_t P2, typename X, typename Y>
     static void apply(const X& x, Y&& y) {
         constexpr_select const auto selected_impl = select_pool_impl<X, Y>();

         if constexpr_select (selected_impl == pool_impl::STD) {
             inc_counter("impl:std");
             etl::impl::standard::max_pool_2d::apply<C1, C2, S1, S2, P1, P2>(smart_forward(x), y);
         } else if constexpr_select (selected_impl == pool_impl::CUDNN) {
             // The CUDNN implementation takes the parameters as runtime values
             inc_counter("impl:cudnn");
             etl::impl::cudnn::max_pool_2d::apply(smart_forward_gpu(x), y, C1, C2, S1, S2, P1, P2);
         } else {
             cpp_unreachable("Invalid selection for pooling");
         }
     }

     /*!
      * \brief Pool x into y, with the pooling parameters given at runtime
      * \param x The expression to pool
      * \param y The expression in which the result is stored
      * \param c1 The first dimension pooling ratio
      * \param c2 The second dimension pooling ratio
      * \param s1 The first dimension stride
      * \param s2 The second dimension stride
      * \param p1 The first dimension padding
      * \param p2 The second dimension padding
      */
     template <typename X, typename Y>
     static void apply(const X& x, Y&& y, size_t c1, size_t c2, size_t s1, size_t s2, size_t p1, size_t p2) {
         constexpr_select const auto selected_impl = select_pool_impl<X, Y>();

         if constexpr_select (selected_impl == pool_impl::STD) {
             inc_counter("impl:std");
             etl::impl::standard::max_pool_2d::apply(smart_forward(x), y, c1, c2, s1, s2, p1, p2);
         } else if constexpr_select (selected_impl == pool_impl::CUDNN) {
             inc_counter("impl:cudnn");
             etl::impl::cudnn::max_pool_2d::apply(smart_forward_gpu(x), y, c1, c2, s1, s2, p1, p2);
         } else {
             cpp_unreachable("Invalid selection for pooling");
         }
     }
 };

 /*!
  * \brief Functor for 2D Average Pooling
  */
 struct avg_pool_2d {
     /*!
      * \brief Indicates if the temporary expression can be directly evaluated
      * using only GPU. The value is cudnn_enabled, whatever A is.
      */
     template <typename A>
     static constexpr bool gpu_computable = cudnn_enabled;

     /*!
      * \brief Pool x into y, with the pooling parameters given at compile time
      * \tparam C1 The first dimension pooling ratio
      * \tparam C2 The second dimension pooling ratio
      * \tparam S1 The first dimension stride
      * \tparam S2 The second dimension stride
      * \tparam P1 The first dimension padding
      * \tparam P2 The second dimension padding
      * \param x The expression to pool
      * \param y The expression in which the result is stored
      */
     template <size_t C1, size_t C2, size_t S1, size_t S2, size_t P1, size_t P2, typename X, typename Y>
     static void apply(const X& x, Y&& y) {
         constexpr_select const auto selected_impl = select_pool_impl<X, Y>();

         if constexpr_select (selected_impl == pool_impl::STD) {
             inc_counter("impl:std");
             etl::impl::standard::avg_pool_2d::apply<C1, C2, S1, S2, P1, P2>(smart_forward(x), y);
         } else if constexpr_select (selected_impl == pool_impl::CUDNN) {
             // The CUDNN implementation takes the parameters as runtime values
             inc_counter("impl:cudnn");
             etl::impl::cudnn::avg_pool_2d::apply(smart_forward_gpu(x), y, C1, C2, S1, S2, P1, P2);
         } else {
             cpp_unreachable("Invalid selection for pooling");
         }
     }

     /*!
      * \brief Pool x into y, with the pooling parameters given at runtime
      * \param x The expression to pool
      * \param y The expression in which the result is stored
      * \param c1 The first dimension pooling ratio
      * \param c2 The second dimension pooling ratio
      * \param s1 The first dimension stride
      * \param s2 The second dimension stride
      * \param p1 The first dimension padding
      * \param p2 The second dimension padding
      */
     template <typename X, typename Y>
     static void apply(const X& x, Y&& y, size_t c1, size_t c2, size_t s1, size_t s2, size_t p1, size_t p2) {
         constexpr_select const auto selected_impl = select_pool_impl<X, Y>();

         if constexpr_select (selected_impl == pool_impl::STD) {
             inc_counter("impl:std");
             etl::impl::standard::avg_pool_2d::apply(smart_forward(x), y, c1, c2, s1, s2, p1, p2);
         } else if constexpr_select (selected_impl == pool_impl::CUDNN) {
             inc_counter("impl:cudnn");
             etl::impl::cudnn::avg_pool_2d::apply(smart_forward_gpu(x), y, c1, c2, s1, s2, p1, p2);
         } else {
             cpp_unreachable("Invalid selection for pooling");
         }
     }
 };

 /*!
  * \brief Functor for 3D Max Pooling
  */
 struct max_pool_3d {
     /*!
      * \brief Indicates if the temporary expression can be directly evaluated
      * using only GPU. The value is cudnn_enabled, whatever A is.
      */
     template <typename A>
     static constexpr bool gpu_computable = cudnn_enabled;

     /*!
      * \brief Pool x into y, with the pooling parameters given at compile time
      * \tparam C1 The first dimension pooling ratio
      * \tparam C2 The second dimension pooling ratio
      * \tparam C3 The third dimension pooling ratio
      * \tparam S1 The first dimension stride
      * \tparam S2 The second dimension stride
      * \tparam S3 The third dimension stride
      * \tparam P1 The first dimension padding
      * \tparam P2 The second dimension padding
      * \tparam P3 The third dimension padding
      * \param x The expression to pool
      * \param y The expression in which the result is stored
      */
     template <size_t C1, size_t C2, size_t C3, size_t S1, size_t S2, size_t S3, size_t P1, size_t P2, size_t P3, typename X, typename Y>
     static void apply(const X& x, Y&& y) {
         constexpr_select const auto selected_impl = select_pool_impl<X, Y>();

         if constexpr_select (selected_impl == pool_impl::STD) {
             inc_counter("impl:std");
             etl::impl::standard::max_pool_3d::apply<C1, C2, C3, S1, S2, S3, P1, P2, P3>(smart_forward(x), y);
         } else if constexpr_select (selected_impl == pool_impl::CUDNN) {
             // The CUDNN implementation takes the parameters as runtime values
             inc_counter("impl:cudnn");
             etl::impl::cudnn::max_pool_3d::apply(smart_forward_gpu(x), y, C1, C2, C3, S1, S2, S3, P1, P2, P3);
         } else {
             cpp_unreachable("Invalid selection for pooling");
         }
     }

     /*!
      * \brief Pool x into y, with the pooling parameters given at runtime
      * \param x The expression to pool
      * \param y The expression in which the result is stored
      * \param c1 The first dimension pooling ratio
      * \param c2 The second dimension pooling ratio
      * \param c3 The third dimension pooling ratio
      * \param s1 The first dimension stride
      * \param s2 The second dimension stride
      * \param s3 The third dimension stride
      * \param p1 The first dimension padding
      * \param p2 The second dimension padding
      * \param p3 The third dimension padding
      */
     template <typename X, typename Y>
     static void apply(const X& x, Y&& y, size_t c1, size_t c2, size_t c3, size_t s1, size_t s2, size_t s3, size_t p1, size_t p2, size_t p3) {
         constexpr_select const auto selected_impl = select_pool_impl<X, Y>();

         if constexpr_select (selected_impl == pool_impl::STD) {
             inc_counter("impl:std");
             etl::impl::standard::max_pool_3d::apply(smart_forward(x), y, c1, c2, c3, s1, s2, s3, p1, p2, p3);
         } else if constexpr_select (selected_impl == pool_impl::CUDNN) {
             inc_counter("impl:cudnn");
             etl::impl::cudnn::max_pool_3d::apply(smart_forward_gpu(x), y, c1, c2, c3, s1, s2, s3, p1, p2, p3);
         } else {
             cpp_unreachable("Invalid selection for pooling");
         }
     }
 };

 /*!
  * \brief Functor for 3D Average Pooling
  */
 struct avg_pool_3d {
     /*!
      * \brief Indicates if the temporary expression can be directly evaluated
      * using only GPU. The value is cudnn_enabled, whatever A is.
      */
     template <typename A>
     static constexpr bool gpu_computable = cudnn_enabled;

     /*!
      * \brief Pool x into y, with the pooling parameters given at compile time
      * \tparam C1 The first dimension pooling ratio
      * \tparam C2 The second dimension pooling ratio
      * \tparam C3 The third dimension pooling ratio
      * \tparam S1 The first dimension stride
      * \tparam S2 The second dimension stride
      * \tparam S3 The third dimension stride
      * \tparam P1 The first dimension padding
      * \tparam P2 The second dimension padding
      * \tparam P3 The third dimension padding
      * \param x The expression to pool
      * \param y The expression in which the result is stored
      */
     template <size_t C1, size_t C2, size_t C3, size_t S1, size_t S2, size_t S3, size_t P1, size_t P2, size_t P3, typename X, typename Y>
     static void apply(const X& x, Y&& y) {
         constexpr_select const auto impl = select_pool_impl<X, Y>();

         if
             constexpr_select(impl == pool_impl::STD) {
                 inc_counter("impl:std");
                 etl::impl::standard::avg_pool_3d::apply<C1, C2, C3, S1, S2, S3, P1, P2, P3>(smart_forward(x), y);
             }
         else if
             constexpr_select(impl == pool_impl::CUDNN) {
                 // The CUDNN implementation takes the parameters as runtime values
                 inc_counter("impl:cudnn");
                 etl::impl::cudnn::avg_pool_3d::apply(smart_forward_gpu(x), y, C1, C2, C3, S1, S2, S3, P1, P2, P3);
             }
         else {
             cpp_unreachable("Invalid selection for pooling");
         }
     }

     /*!
      * \brief Pool x into y, with the pooling parameters given at runtime
      * \param x The expression to pool
      * \param y The expression in which the result is stored
      * \param c1 The first dimension pooling ratio
      * \param c2 The second dimension pooling ratio
      * \param c3 The third dimension pooling ratio
      * \param s1 The first dimension stride
      * \param s2 The second dimension stride
      * \param s3 The third dimension stride
      * \param p1 The first dimension padding
      * \param p2 The second dimension padding
      * \param p3 The third dimension padding
      */
     template <typename X, typename Y>
     static void apply(const X& x, Y&& y, size_t c1, size_t c2, size_t c3, size_t s1, size_t s2, size_t s3, size_t p1, size_t p2, size_t p3) {
         // Declared with constexpr_select like every other pooling functor, so that
         // the selection is explicitly a constant expression whenever the
         // if constexpr_select chain below needs one.
         constexpr_select const auto impl = select_pool_impl<X, Y>();

         if
             constexpr_select(impl == pool_impl::STD) {
                 inc_counter("impl:std");
                 etl::impl::standard::avg_pool_3d::apply(smart_forward(x), y, c1, c2, c3, s1, s2, s3, p1, p2, p3);
             }
         else if
             constexpr_select(impl == pool_impl::CUDNN) {
                 inc_counter("impl:cudnn");
                 etl::impl::cudnn::avg_pool_3d::apply(smart_forward_gpu(x), y, c1, c2, c3, s1, s2, s3, p1, p2, p3);
             }
         else {
             cpp_unreachable("Invalid selection for pooling");
         }
     }
 };

 } //end of namespace etl::impl
etl::impl::standard::avg_pool_3d::apply
static void apply(const A &sub, M &&m)
Apply the functor on sub and store the result in m.
Definition: avg_pooling.hpp:587

etl::pool_impl
pool_impl
Enumeration describing the different implementations of pooling.
Definition: pool_impl.hpp:21

etl::pool_impl::STD
Standard implementation.

etl::impl::avg_pool_2d::apply
static void apply(const X &x, Y &&y, size_t c1, size_t c2, size_t s1, size_t s2, size_t p1, size_t p2)
Pool x into y.
Definition: pooling.hpp:232

etl::impl::avg_pool_2d
Functor for 2D Average Pooling.
Definition: pooling.hpp:174

etl::impl::avg_pool_2d::apply
static void apply(const X &x, Y &&y)
Pool x into y.
Definition: pooling.hpp:198

etl::impl::max_pool_2d::apply
static void apply(const X &x, Y &&y)
Pool x into y.
Definition: pooling.hpp:118

etl::impl::standard::max_pool_3d::apply
static void apply(const A &sub, M &&m)
Apply the functor on sub and store the result in m.
Definition: max_pooling.hpp:855

etl::local_context
context & local_context()
Return the configuration context of the current thread.
Definition: context.hpp:50

etl::impl::max_pool_2d
Functor for 2D Max Pooling.
Definition: pooling.hpp:94

etl::impl::avg_pool_3d::apply
static void apply(const X &x, Y &&y, size_t c1, size_t c2, size_t c3, size_t s1, size_t s2, size_t s3, size_t p1, size_t p2, size_t p3)
Pool x into y.
Definition: pooling.hpp:392

etl::cudnn_enabled
constexpr bool cudnn_enabled
Indicates if the NVIDIA CUDNN library is available for ETL.
Definition: config.hpp:114

etl::impl::cudnn::max_pool_3d::apply
static void apply([[maybe_unused]] const X &x, [[maybe_unused]] Y &&y, [[maybe_unused]] size_t c1, [[maybe_unused]] size_t c2, [[maybe_unused]] size_t c3, [[maybe_unused]] size_t s1, [[maybe_unused]] size_t s2, [[maybe_unused]] size_t s3, [[maybe_unused]] size_t p1, [[maybe_unused]] size_t p2, [[maybe_unused]] size_t p3)
Apply the functor on sub and store the result in m.
Definition: max_pooling.hpp:249

etl::context::cpu
bool cpu
Force CPU evaluation.
Definition: context.hpp:29

etl::pool_impl::CUDNN
GPU implementation.

etl::impl::max_pool_2d::gpu_computable
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: pooling.hpp:100

etl::impl::cudnn::avg_pool_3d::apply
static void apply([[maybe_unused]] const X &x, [[maybe_unused]] Y &&y, [[maybe_unused]] size_t c1, [[maybe_unused]] size_t c2, [[maybe_unused]] size_t c3, [[maybe_unused]] size_t s1, [[maybe_unused]] size_t s2, [[maybe_unused]] size_t s3, [[maybe_unused]] size_t p1, [[maybe_unused]] size_t p2, [[maybe_unused]] size_t p3)
Apply the functor on sub and store the result in m.
Definition: max_pooling.hpp:276

etl::impl::avg_pool_3d::apply
static void apply(const X &x, Y &&y)
Pool x into y.
Definition: pooling.hpp:358

etl::smart_forward_gpu
decltype(auto) smart_forward_gpu(E &expr)
Smart forwarding for a temporary expression that will be computed in GPU.
Definition: helpers.hpp:343

etl::impl::standard::max_pool_2d::apply
static void apply(const A &sub, M &&m)
Apply the functor on sub and store the result in m.
Definition: max_pooling.hpp:134

etl::impl::max_pool_2d::apply
static void apply(const X &x, Y &&y, size_t c1, size_t c2, size_t s1, size_t s2, size_t p1, size_t p2)
Pool x into y.
Definition: pooling.hpp:152

etl::impl::avg_pool_3d
Functor for 3D Average Pooling.
Definition: pooling.hpp:334

etl::impl::standard::avg_pool_2d::apply
static void apply(const A &sub, M &&m)
Apply the functor on sub and store the result in m.
Definition: avg_pooling.hpp:127

etl::smart_forward
decltype(auto) smart_forward(E &expr)
Smart forwarding for a temporary expression.
Definition: helpers.hpp:323

etl::impl::max_pool_3d::apply
static void apply(const X &x, Y &&y)
Pool x into y.
Definition: pooling.hpp:278

etl::impl::cudnn::max_pool_2d::apply
static void apply([[maybe_unused]] const X &x, [[maybe_unused]] Y &&y, [[maybe_unused]] size_t c1, [[maybe_unused]] size_t c2, [[maybe_unused]] size_t s1, [[maybe_unused]] size_t s2, [[maybe_unused]] size_t p1, [[maybe_unused]] size_t p2)
Apply the functor on sub and store the result in m.
Definition: max_pooling.hpp:201

etl::impl
Definition: avg_pooling_derivative.hpp:10

etl::inc_counter
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25

etl::impl::max_pool_3d::apply
static void apply(const X &x, Y &&y, size_t c1, size_t c2, size_t c3, size_t s1, size_t s2, size_t s3, size_t p1, size_t p2, size_t p3)
Pool x into y.
Definition: pooling.hpp:312

etl::impl::max_pool_3d
Functor for 3D Max Pooling.
Definition: pooling.hpp:254

etl::impl::cudnn::avg_pool_2d::apply
static void apply([[maybe_unused]] const X &x, [[maybe_unused]] Y &&y, [[maybe_unused]] size_t c1, [[maybe_unused]] size_t c2, [[maybe_unused]] size_t s1, [[maybe_unused]] size_t s2, [[maybe_unused]] size_t p1, [[maybe_unused]] size_t p2)
Apply the functor on sub and store the result in m.
Definition: max_pooling.hpp:225