Expression Templates Library (ETL)
dyn_pool_upsample_2d_expr.hpp
1 //=======================================================================
2 // Copyright (c) 2014-2023 Baptiste Wicht
3 // Distributed under the terms of the MIT License.
4 // (See accompanying file LICENSE or copy at
5 // http://opensource.org/licenses/MIT)
6 //=======================================================================
7 
8 #pragma once
9 
10 #include "etl/expr/base_temporary_expr.hpp"
11 
12 //Get the implementations
13 #include "etl/impl/std/max_pooling_upsample.hpp"
14 #include "etl/impl/std/avg_pooling_upsample.hpp"
15 #include "etl/impl/cudnn/pooling_upsample.hpp"
16 
17 namespace etl {
18 
25 template <etl_expr A, same_dimensions<A> B, same_dimensions<A> C, bool Max>
26 struct dyn_pool_upsample_2d_expr : base_temporary_expr_tern<dyn_pool_upsample_2d_expr<A, B, C, Max>, A, B, C> {
31 
32  static constexpr auto storage_order = sub_traits::storage_order;
33 
38  static constexpr bool gpu_computable = cudnn_enabled && all_floating<A, B> && all_homogeneous<A, B>;
39 
40 private:
41  const size_t c1;
42  const size_t c2;
43 
44  const size_t s1;
45  const size_t s2;
46 
47  const size_t p1;
48  const size_t p2;
49 
51 
52 public:
57  dyn_pool_upsample_2d_expr(A a, B b, C c, size_t c1, size_t c2, size_t s1, size_t s2, size_t p1, size_t p2) :
58  base_type(a, b, c), c1(c1), c2(c2), s1(s1), s2(s2), p1(p1), p2(p2) {
59  //Nothing else to init
60  }
61 
67  template <same_dimensions<A> R>
68  void check([[maybe_unused]] const A& a, [[maybe_unused]] const B& b, [[maybe_unused]] const C& c, [[maybe_unused]] const R& result) const {
69  static constexpr size_t D = etl::decay_traits<A>::dimensions();
70 
71  cpp_assert(etl::size(result) == etl::size(a), "max_pool_upsample_2d:A and R must have the same size");
72  cpp_assert(etl::size(b) == etl::size(c), "max_pool_upsample_2d:B and C must have the same size");
73 
74  cpp_assert(etl::dim<D - 2>(a) == s1 * (etl::dim<D - 2>(b) - 1) - 2 * p1 + c1, "Invalid pooling dimensions for max_pool_upsample_2d");
75  cpp_assert(etl::dim<D - 1>(a) == s2 * (etl::dim<D - 1>(b) - 1) - 2 * p2 + c2, "Invalid pooling dimensions for max_pool_upsample_2d");
76  }
77 
78  // Assignment functions
79 
87  template <typename R>
88  static constexpr etl::pool_impl select_default_impl(bool no_gpu) {
89  if (cudnn_enabled && all_floating<A, B, C, R> && !no_gpu) {
90  return etl::pool_impl::CUDNN;
91  }
92 
93  return etl::pool_impl::STD;
94  }
95 
96 #ifdef ETL_MANUAL_SELECT
97 
102  template <typename R>
103  static etl::pool_impl select_impl() {
104  if (local_context().pool_selector.forced) {
105  auto forced = local_context().pool_selector.impl;
106 
107  switch (forced) {
108  // CUDNN cannot always be used
109  case pool_impl::CUDNN:
110  if (!cudnn_enabled || !all_floating<A, B, C, R> || local_context().cpu) { //COVERAGE_EXCLUDE_LINE
111  std::cerr << "Forced selection to CUDNN pool implementation, but not possible for this expression" << std::endl; //COVERAGE_EXCLUDE_LINE
112  return select_default_impl<R>(local_context().cpu); //COVERAGE_EXCLUDE_LINE
113  } //COVERAGE_EXCLUDE_LINE
114 
115  return forced;
116 
117  //In other cases, simply use the forced impl
118  default:
119  return forced;
120  }
121  }
122 
123  return select_default_impl<R>(local_context().cpu);
124  }
125 
126 #else
127 
133  template <typename R>
134  static constexpr etl::pool_impl select_impl() {
135  return select_default_impl<R>(false);
136  }
137 
138 #endif
139 
140  // Assignment functions
141 
146  template <etl_expr R>
147  void assign_to(R&& result) const {
148  inc_counter("temp:assign");
149 
150  auto& a = this->a();
151  auto& b = this->b();
152  auto& c = this->c();
153 
154  check(a, b, c, result);
155 
156  constexpr_select auto impl = select_impl<R>();
157 
158  if constexpr (Max) {
159  if
160  constexpr_select(impl == pool_impl::STD) {
161  inc_counter("impl:std");
163  }
164  else if
165  constexpr_select(impl == pool_impl::CUDNN) {
166  inc_counter("impl:cudnn");
168  }
169  else {
170  cpp_unreachable("Invalid pool implementation");
171  }
172  } else {
173  if
174  constexpr_select(impl == pool_impl::STD) {
175  inc_counter("impl:std");
177  }
178  else if
179  constexpr_select(impl == pool_impl::CUDNN) {
180  inc_counter("impl:cudnn");
182  }
183  else {
184  cpp_unreachable("Invalid pool implementation");
185  }
186  }
187  }
188 
193  template <typename L>
194  void assign_add_to(L&& lhs) const {
195  std_add_evaluate(*this, lhs);
196  }
197 
202  template <typename L>
203  void assign_sub_to(L&& lhs) const {
204  std_sub_evaluate(*this, lhs);
205  }
206 
211  template <typename L>
212  void assign_mul_to(L&& lhs) const {
213  std_mul_evaluate(*this, lhs);
214  }
215 
220  template <typename L>
221  void assign_div_to(L&& lhs) const {
222  std_div_evaluate(*this, lhs);
223  }
224 
229  template <typename L>
230  void assign_mod_to(L&& lhs) const {
231  std_mod_evaluate(*this, lhs);
232  }
233 
240  friend std::ostream& operator<<(std::ostream& os, const dyn_pool_upsample_2d_expr& expr) {
241  return os << "max_pool_upsample2(" << expr._a << ", " << expr._b << ", " << expr._c << ")";
242  }
243 };
244 
249 template <typename A, typename B, typename C, bool Max>
250 struct etl_traits<etl::dyn_pool_upsample_2d_expr<A, B, C, Max>> {
252  using sub_expr_t = std::decay_t<A>;
255 
256  static constexpr bool is_etl = true;
257  static constexpr bool is_transformer = false;
258  static constexpr bool is_view = false;
259  static constexpr bool is_magic_view = false;
260  static constexpr bool is_fast = false;
261  static constexpr bool is_linear = false;
262  static constexpr bool is_thread_safe = true;
263  static constexpr bool is_value = false;
264  static constexpr bool is_direct = true;
265  static constexpr bool is_generator = false;
266  static constexpr bool is_padded = false;
267  static constexpr bool is_aligned = true;
268  static constexpr bool is_temporary = true;
269  static constexpr bool gpu_computable = is_gpu_t<value_type> && cuda_enabled;
270  static constexpr order storage_order = sub_traits::storage_order;
271 
277  template <vector_mode_t V>
278  static constexpr bool vectorizable = true;
279 
286  static size_t dim(const expr_t& e, size_t d) {
287  return etl::dim(e.a(), d);
288  }
289 
295  static size_t size(const expr_t& e) {
296  return etl::size(e.a());
297  }
298 
303  static constexpr size_t dimensions() {
304  return sub_traits::dimensions();
305  }
306 
311  static constexpr int complexity() noexcept {
312  return -1;
313  }
314 };
315 
324 template <typename A, typename B, typename C>
326  A&& input, B&& output, C&& errors, size_t c1, size_t c2) {
327  return {input, output, errors, c1, c2, c1, c2, 0, 0};
328 }
329 
338 template <typename A, typename B, typename C>
339 dyn_pool_upsample_2d_expr<detail::build_type<A>, detail::build_type<B>, detail::build_type<C>, true> max_pool_upsample_2d(
340  A&& input, B&& output, C&& errors, size_t c1, size_t c2, size_t s1, size_t s2, size_t p1 = 0, size_t p2 = 0) {
341  return {input, output, errors, c1, c2, s1, s2, p1, p2};
342 }
343 
352 template <typename A, typename B, typename C>
353 dyn_pool_upsample_2d_expr<detail::build_type<A>, detail::build_type<B>, detail::build_type<C>, false> avg_pool_upsample_2d(
354  A&& input, B&& output, C&& errors, size_t c1, size_t c2) {
355  return {input, output, errors, c1, c2, c1, c2, 0, 0};
356 }
357 
366 template <typename A, typename B, typename C>
367 dyn_pool_upsample_2d_expr<detail::build_type<A>, detail::build_type<B>, detail::build_type<C>, false> avg_pool_upsample_2d(
368  A&& input, B&& output, C&& errors, size_t c1, size_t c2, size_t s1, size_t s2, size_t p1 = 0, size_t p2 = 0) {
369  return {input, output, errors, c1, c2, s1, s2, p1, p2};
370 }
371 
372 } //end of namespace etl
value_t< A > value_type
The type of value of the expression.
Definition: dyn_pool_upsample_2d_expr.hpp:27
static constexpr auto storage_order
The sub storage order.
Definition: dyn_pool_upsample_2d_expr.hpp:32
std::add_lvalue_reference_t< B > b()
Returns the sub expression.
Definition: base_temporary_expr.hpp:702
static void apply([[maybe_unused]] A &&in, [[maybe_unused]] B &&out, [[maybe_unused]] C &&errors, [[maybe_unused]] M &m, [[maybe_unused]] size_t c1, [[maybe_unused]] size_t c2, [[maybe_unused]] size_t s1, [[maybe_unused]] size_t s2, [[maybe_unused]] size_t p1, [[maybe_unused]] size_t p2)
Apply the functor on sub and store the result in m.
Definition: pooling_upsample.hpp:263
pool_impl
Enumeration describing the different implementations of pooling.
Definition: pool_impl.hpp:21
Standard implementation.
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311
static void apply(A &&in, B &&out, C &&errors, M &&m)
Apply the functor on sub and store the result in m.
Definition: max_pooling_upsample.hpp:410
D D
The number of dimensions.
Definition: dyn_matrix_view.hpp:24
void check([[maybe_unused]] const A &a, [[maybe_unused]] const B &b, [[maybe_unused]] const C &c, [[maybe_unused]] const R &result) const
Validate the transposition dimensions.
Definition: dyn_pool_upsample_2d_expr.hpp:68
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: dyn_pool_upsample_2d_expr.hpp:203
void assign_to(R &&result) const
Assign to a matrix of the same storage order.
Definition: dyn_pool_upsample_2d_expr.hpp:147
order
Storage order of a matrix.
Definition: order.hpp:15
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94
A _a
The first sub expression reference.
Definition: base_temporary_expr.hpp:638
static void apply([[maybe_unused]] A &&in, [[maybe_unused]] B &&out, [[maybe_unused]] C &&errors, [[maybe_unused]] M &m, [[maybe_unused]] size_t c1, [[maybe_unused]] size_t c2, [[maybe_unused]] size_t s1, [[maybe_unused]] size_t s2, [[maybe_unused]] size_t p1, [[maybe_unused]] size_t p2)
Apply the functor on sub and store the result in m.
Definition: pooling_upsample.hpp:213
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: dyn_pool_upsample_2d_expr.hpp:303
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:686
A derivative of the 2D max pooling (combine derivative and upsampling for performance) ...
Definition: dyn_pool_upsample_2d_expr.hpp:26
constexpr bool is_fast
Traits to test if the given ETL expresion type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588
Traits to get information about ETL types.
Definition: tmp.hpp:68
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: dyn_pool_upsample_2d_expr.hpp:230
Root namespace for the ETL library.
Definition: adapter.hpp:15
static constexpr etl::pool_impl select_default_impl(bool no_gpu)
Select the pool implementation for an expression of type ABC->R.
Definition: dyn_pool_upsample_2d_expr.hpp:88
context & local_context()
Return the configuration context of the current thread.
Definition: context.hpp:50
static constexpr size_t dimensions()
Return the number of dimensions of the expression.
Definition: traits_base.hpp:31
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: dyn_pool_upsample_2d_expr.hpp:311
auto dim(E &&value, size_t i) -> detail::identity_helper< E, dim_view< detail::build_identity_type< E >, D >>
Return a view representing the ith Dth dimension.
Definition: view_expression_builder.hpp:25
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: dyn_pool_upsample_2d_expr.hpp:295
std::conditional_t< is_etl_value< T >, const std::decay_t< T > &, std::decay_t< T > > build_type
Helper to build the type for a sub expression.
Definition: expression_helpers.hpp:24
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: dyn_pool_upsample_2d_expr.hpp:194
constexpr bool cudnn_enabled
Indicates if the NVIDIA CUDNN library is available for ETL.
Definition: config.hpp:114
value_t< A > value_type
The value type of the expression.
Definition: dyn_pool_upsample_2d_expr.hpp:254
bool cpu
Force CPU evaluation.
Definition: context.hpp:29
GPU implementation.
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271
Abstract base class for temporary ternary expression.
Definition: base_temporary_expr.hpp:634
friend std::ostream & operator<<(std::ostream &os, const dyn_pool_upsample_2d_expr &expr)
Print a representation of the expression on the given stream.
Definition: dyn_pool_upsample_2d_expr.hpp:240
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: dyn_pool_upsample_2d_expr.hpp:212
static constexpr etl::pool_impl select_impl()
Select the pool implementation for an expression of type ABC->R.
Definition: dyn_pool_upsample_2d_expr.hpp:134
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297
std::decay_t< A > sub_expr_t
The sub expression type.
Definition: dyn_pool_upsample_2d_expr.hpp:252
decltype(auto) smart_forward_gpu(E &expr)
Smart forwarding for a temporary expression that will be computed in GPU.
Definition: helpers.hpp:343
constexpr size_t size(const E &expr) noexcept
Returns the size of the given ETL expression.
Definition: helpers.hpp:108
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: dyn_pool_upsample_2d_expr.hpp:38
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214
decltype(auto) smart_forward(E &expr)
Smart forwarding for a temporary expression.
Definition: helpers.hpp:323
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: dyn_pool_upsample_2d_expr.hpp:221
constexpr bool is_thread_safe
Traits to test if the given ETL expresion type is thread safe.
Definition: traits.hpp:687
B _b
The second sub expression reference.
Definition: base_temporary_expr.hpp:639
static void apply([[maybe_unused]] A &&in, [[maybe_unused]] B &&out, C &&errors, M &&m)
Apply the functor on sub and store the result in m.
Definition: avg_pooling_upsample.hpp:327
C _c
The third sub expression reference.
Definition: base_temporary_expr.hpp:640
static size_t dim(const expr_t &e, size_t d)
Returns the dth dimension of the expression.
Definition: dyn_pool_upsample_2d_expr.hpp:286
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25
std::add_lvalue_reference_t< C > c()
Returns the sub expression.
Definition: base_temporary_expr.hpp:718
dyn_pool_upsample_2d_expr< detail::build_type< A >, detail::build_type< B >, detail::build_type< C >, true > max_pool_upsample_2d(A &&input, B &&output, C &&errors, size_t c1, size_t c2)
Derivative of the 2D Max Pooling of the given matrix expression and upsampling.
Definition: dyn_pool_upsample_2d_expr.hpp:325
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195
dyn_pool_upsample_2d_expr< detail::build_type< A >, detail::build_type< B >, detail::build_type< C >, false > avg_pool_upsample_2d(A &&input, B &&output, C &&errors, size_t c1, size_t c2)
Derivative of the 2D Average Pooling of the given matrix expression and upsampling.
Definition: dyn_pool_upsample_2d_expr.hpp:353
dyn_pool_upsample_2d_expr(A a, B b, C c, size_t c1, size_t c2, size_t s1, size_t s2, size_t p1, size_t p2)
Construct a new expression.
Definition: dyn_pool_upsample_2d_expr.hpp:57