Expression Templates Library (ETL)
conv_4d_backward_expr.hpp
1 //=======================================================================
2 // Copyright (c) 2014-2023 Baptiste Wicht
3 // Distributed under the terms of the MIT License.
4 // (See accompanying file LICENSE or copy at
5 // http://opensource.org/licenses/MIT)
6 //=======================================================================
7 
8 #pragma once
9 
10 #include "etl/expr/base_temporary_expr.hpp"
11 
12 //Get the implementations
13 #include "etl/impl/conv.hpp"
14 
15 namespace etl {
16 
43 template <etl_4d A, etl_4d B, size_t S1, size_t S2, size_t P1, size_t P2, bool Flipped>
44 struct conv_4d_backward_expr : base_temporary_expr_bin<conv_4d_backward_expr<A, B, S1, S2, P1, P2, Flipped>, A, B> {
49 
50  static constexpr auto storage_order = left_traits::storage_order;
51 
56  static constexpr bool gpu_computable = cudnn_enabled && impl::cudnn::conv_possible_<A, B>;
57 
62  explicit conv_4d_backward_expr(A a, B b) : base_type(a, b) {
63  //Nothing else to init
64  }
65 
66  // Assignment functions
67 
71  template <etl_4d I, etl_4d K, etl_4d C>
72  static void check([[maybe_unused]] const I& input, [[maybe_unused]] const K& kernel, [[maybe_unused]] const C& conv) {
73  if constexpr (all_fast<A, B, C>) {
74  static_assert(etl::dim<0, C>() == etl::dim<0, I>(), "Invalid dimensions for conv4_backward");
75  static_assert(etl::dim<1, C>() == etl::dim<1, K>(), "Invalid dimensions for conv4_backward");
76  static_assert(etl::dim<1, I>() == etl::dim<0, K>(), "Invalid dimensions for conv4_backward");
77 
78  static_assert(etl::dim<2, C>() == S1 * (etl::dim<2, I>() - 1) + etl::dim<2, K>() - 2 * P1, "Invalid dimensions for conv2_backward");
79  static_assert(etl::dim<3, C>() == S2 * (etl::dim<3, I>() - 1) + etl::dim<3, K>() - 2 * P2, "Invalid dimensions for conv2_backward");
80  } else {
81  cpp_assert(etl::dim(conv, 0) == etl::dim(input, 0), "Invalid dimensions for conv4_backward");
82  cpp_assert(etl::dim(conv, 1) == etl::dim(kernel, 1), "Invalid dimensions for conv4_backward");
83  cpp_assert(etl::dim(input, 1) == etl::dim(kernel, 0), "Invalid dimensions for conv4_backward");
84 
85  cpp_assert(etl::dim(conv, 2) == S1 * (etl::dim(input, 2) - 1) + etl::dim(kernel, 2) - 2 * P1, "Invalid dimensions for conv2_backward");
86  cpp_assert(etl::dim(conv, 3) == S2 * (etl::dim(input, 3) - 1) + etl::dim(kernel, 3) - 2 * P2, "Invalid dimensions for conv2_backward");
87  }
88  }
89 
94  template <etl_expr C>
95  void assign_to(C&& conv) const {
96  inc_counter("temp:assign");
97 
98  auto& input = this->a();
99  auto& kernel = this->b();
100 
101  check(input, kernel, conv);
102 
103  // Need K1 / K2 to compute transposed padding
104  const size_t K1 = etl::dim<2>(kernel);
105  const size_t K2 = etl::dim<3>(kernel);
106 
107  if constexpr (Flipped) {
108  // The GPU implementation needs the real forward parameters, not the
109  // converted backward parameters
110  if constexpr (cudnn_enabled && all_floating<A, B, C>) {
111  impl::cudnn::conv4_backward_data_flipped(smart_forward_gpu(input), smart_forward_gpu(kernel), conv, S1, S2, P1, P2);
112  return;
113  } else {
114  // 1. Handle unit strides
115  if constexpr (S1 == 1 && S2 == 1) {
116  if constexpr (P1 == 0 && P2 == 0) {
117  // Unit strides, non-zero padding -> Full convolution
118  detail::conv4_full_flipped_impl::apply(input, kernel, conv);
119  } else {
120  // Unit strides, zero padding -> Valid convolution with the correct padding
121  detail::dyn_conv4_valid_back_flipped_impl::apply(input, kernel, conv, 1, 1, K1 - P1 - 1, K2 - P2 - 1);
122  }
123  }
124  // 2. Handle non_unit strides
125  else {
126  // Fractionally-strided convolution needs inner padding of the input
127  auto strided_input = impl::common::inner_pad(input, S1, S2);
128 
129  if constexpr (P1 == 0 && P2 == 0) {
130  // Non-unit strides, non-zero padding -> Fractionally-strided full convolution
131  detail::conv4_full_flipped_impl::apply(strided_input, kernel, conv);
132  } else {
133  // Non-unit strides, zero padding -> Fractionally-strided Valid convolution with the correct padding
134  detail::dyn_conv4_valid_back_flipped_impl::apply(strided_input, kernel, conv, 1, 1, K1 - P1 - 1, K2 - P2 - 1);
135  }
136  }
137  }
138  } else {
139  // The GPU implementation needs the real forward parameters, not the
140  // converted backward parameters
141  if constexpr (cudnn_enabled && all_floating<A, B, C>) {
142  impl::cudnn::conv4_backward_data(smart_forward_gpu(input), smart_forward_gpu(kernel), conv, S1, S2, P1, P2);
143  return;
144  } else {
145  // 1. Handle unit strides
146  if constexpr (S1 == 1 && S2 == 1) {
147  if constexpr (P1 == 0 && P2 == 0) {
148  // Unit strides, non-zero padding -> Full convolution
149  detail::conv4_full_impl::apply(input, kernel, conv);
150  } else {
151  // Unit strides, zero padding -> Valid convolution with the correct padding
152  detail::dyn_conv4_valid_back_impl::apply(input, kernel, conv, 1, 1, K1 - P1 - 1, K2 - P2 - 1);
153  }
154  }
155  // 2. Handle non_unit strides
156  else {
157  // Fractionally-strided convolution needs inner padding of the input
158  auto strided_input = impl::common::inner_pad(input, S1, S2);
159 
160  if constexpr (P1 == 0 && P2 == 0) {
161  // Non-unit strides, non-zero padding -> Fractionally-strided full convolution
162  detail::conv4_full_impl::apply(strided_input, kernel, conv);
163  } else {
164  // Non-unit strides, zero padding -> Fractionally-strided Valid convolution with the correct padding
165  detail::dyn_conv4_valid_back_impl::apply(strided_input, kernel, conv, 1, 1, K1 - P1 - 1, K2 - P2 - 1);
166  }
167  }
168  }
169  }
170  }
171 
176  template <typename L>
177  void assign_add_to(L&& lhs) const {
178  std_add_evaluate(*this, lhs);
179  }
180 
185  template <typename L>
186  void assign_sub_to(L&& lhs) const {
187  std_sub_evaluate(*this, lhs);
188  }
189 
194  template <typename L>
195  void assign_mul_to(L&& lhs) const {
196  std_mul_evaluate(*this, lhs);
197  }
198 
203  template <typename L>
204  void assign_div_to(L&& lhs) const {
205  std_div_evaluate(*this, lhs);
206  }
207 
212  template <typename L>
213  void assign_mod_to(L&& lhs) const {
214  std_mod_evaluate(*this, lhs);
215  }
216 
223  friend std::ostream& operator<<(std::ostream& os, const conv_4d_backward_expr& expr) {
224  return os << "conv4_backward(" << expr._a << ", " << expr._b << ")";
225  }
226 };
227 
232 template <typename A, typename B, size_t S1, size_t S2, size_t P1, size_t P2, bool Flipped>
233 struct etl_traits<etl::conv_4d_backward_expr<A, B, S1, S2, P1, P2, Flipped>> {
235  using left_expr_t = std::decay_t<A>;
236  using right_expr_t = std::decay_t<B>;
240 
241  static constexpr bool is_etl = true;
242  static constexpr bool is_transformer = false;
243  static constexpr bool is_view = false;
244  static constexpr bool is_magic_view = false;
245  static constexpr bool is_fast = all_fast<A, B>;
246  static constexpr bool is_linear = false;
247  static constexpr bool is_thread_safe = true;
248  static constexpr bool is_value = false;
249  static constexpr bool is_direct = true;
250  static constexpr bool is_generator = false;
251  static constexpr bool is_padded = false;
252  static constexpr bool is_aligned = true;
253  static constexpr bool is_temporary = true;
254  static constexpr bool gpu_computable = is_gpu_t<value_type> && cuda_enabled;
255  static constexpr order storage_order = left_traits::storage_order;
256 
262  template <vector_mode_t V>
263  static constexpr bool vectorizable = true;
264 
269  template <size_t DD>
270  static constexpr size_t dim() {
271  return DD == 0
272  ? etl::dim<0, A>()
273  : DD == 1 ? etl::dim<1, B>()
274  : DD == 2 ? (S1 * (etl::dim<2, A>() - 1) + etl::dim<2, B>() - 2 * P1) : (S2 * (etl::dim<3, A>() - 1) + etl::dim<3, B>() - 2 * P2);
275  }
276 
283  static size_t dim(const expr_t& e, size_t d) {
284  if (d == 0) {
285  return etl::dim(e._a, 0);
286  } else if (d == 1) {
287  return etl::dim(e._b, 1);
288  } else if (d == 2) {
289  return S1 * (etl::dim(e._a, 2) - 1) + etl::dim(e._b, 2) - 2 * P1;
290  } else {
291  return S2 * (etl::dim(e._a, 3) - 1) + etl::dim(e._b, 3) - 2 * P2;
292  }
293  }
294 
300  static size_t size(const expr_t& e) {
301  return etl::dim(e._a, 0) * etl::dim(e._b, 1) * (S1 * (etl::dim(e._a, 2) - 1) + etl::dim(e._b, 2) - 2 * P1)
302  * (S2 * (etl::dim(e._a, 3) - 1) + etl::dim(e._b, 3) - 2 * P2);
303  }
304 
309  static constexpr size_t size() {
310  return etl::dim<0, A>() * etl::dim<1, B>() * (S1 * (etl::dim<2, A>() - 1) + etl::dim<2, B>() - 2 * P1)
311  * (S2 * (etl::dim<3, A>() - 1) + etl::dim<3, B>() - 2 * P2);
312  }
313 
318  static constexpr size_t dimensions() {
319  return 4;
320  }
321 
326  static constexpr int complexity() noexcept {
327  return -1;
328  }
329 };
330 
342 template <size_t S1 = 1, size_t S2 = 1, size_t P1 = 0, size_t P2 = 0, etl_expr A, etl_expr B>
344  return conv_4d_backward_expr<detail::build_type<A>, detail::build_type<B>, S1, S2, P1, P2, false>{a, b};
345 }
346 
360 template <size_t S1 = 1, size_t S2 = 1, size_t P1 = 0, size_t P2 = 0, etl_expr A, etl_expr B, etl_expr C>
361 auto conv_4d_backward(A&& a, B&& b, C&& c) {
362  c = conv_4d_backward<S1, S2, P1, P2>(a, b);
363 
364  return c;
365 }
366 
378 template <size_t S1 = 1, size_t S2 = 1, size_t P1 = 0, size_t P2 = 0, etl_expr A, etl_expr B>
379 conv_4d_backward_expr<detail::build_type<A>, detail::build_type<B>, S1, S2, P1, P2, true> conv_4d_backward_flipped(A&& a, B&& b) {
380  return conv_4d_backward_expr<detail::build_type<A>, detail::build_type<B>, S1, S2, P1, P2, true>{a, b};
381 }
382 
396 template <size_t S1 = 1, size_t S2 = 1, size_t P1 = 0, size_t P2 = 0, etl_expr A, etl_expr B, etl_expr C>
397 auto conv_4d_backward_flipped(A&& a, B&& b, C&& c) {
398  c = conv_4d_backward_flipped<S1, S2, P1, P2>(a, b);
399 
400  return c;
401 }
402 
403 } //end of namespace etl
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: conv_4d_backward_expr.hpp:326
Expression representing a batch of transposed 2D convolution of an batch of image with a set of kerne...
Definition: conv_4d_backward_expr.hpp:44
static constexpr auto storage_order
The sub storage order.
Definition: conv_4d_backward_expr.hpp:50
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: conv_4d_backward_expr.hpp:213
B _b
The sub expression reference.
Definition: base_temporary_expr.hpp:534
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: conv_4d_backward_expr.hpp:204
A _a
The sub expression reference.
Definition: base_temporary_expr.hpp:533
static void apply(const I &input, const K &kernel, C &&conv, size_t s1, size_t s2, size_t p1, size_t p2)
Apply the convolution.
Definition: conv_4d.hpp:380
static void apply(const I &input, const K &kernel, C &&conv)
Apply the convolution.
Definition: conv_4d.hpp:408
conv_4d_backward_expr(A a, B b)
Construct a new expression.
Definition: conv_4d_backward_expr.hpp:62
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: conv_4d_backward_expr.hpp:300
order
Storage order of a matrix.
Definition: order.hpp:15
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94
Abstract base class for temporary binary expression.
Definition: base_temporary_expr.hpp:529
conv_4d_backward_expr< detail::build_type< A >, detail::build_type< B >, S1, S2, P1, P2, false > conv_4d_backward(A &&a, B &&b)
Creates an expression representing the transposed 2D convolution of a and b.
Definition: conv_4d_backward_expr.hpp:343
std::add_lvalue_reference_t< B > b()
Returns the sub expression.
Definition: base_temporary_expr.hpp:593
constexpr bool is_fast
Traits to test if the given ETL expresion type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588
Traits to get information about ETL types.
Definition: tmp.hpp:68
static constexpr size_t dim()
Returns the DDth dimension of the expression.
Definition: conv_4d_backward_expr.hpp:270
Root namespace for the ETL library.
Definition: adapter.hpp:15
conv_4d_backward_expr< detail::build_type< A >, detail::build_type< B >, S1, S2, P1, P2, true > conv_4d_backward_flipped(A &&a, B &&b)
Creates an expression representing the transposed 2D convolution of a and flipped b...
Definition: conv_4d_backward_expr.hpp:379
auto dim(E &&value, size_t i) -> detail::identity_helper< E, dim_view< detail::build_identity_type< E >, D >>
Return a view representing the ith Dth dimension.
Definition: view_expression_builder.hpp:25
static void check([[maybe_unused]] const I &input, [[maybe_unused]] const K &kernel, [[maybe_unused]] const C &conv)
Assert that the convolution is done on correct dimensions.
Definition: conv_4d_backward_expr.hpp:72
std::conditional_t< is_etl_value< T >, const std::decay_t< T > &, std::decay_t< T > > build_type
Helper to build the type for a sub expression.
Definition: expression_helpers.hpp:24
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: conv_4d_backward_expr.hpp:177
value_t< A > value_type
The type of value of the expression.
Definition: conv_4d_backward_expr.hpp:45
constexpr bool cudnn_enabled
Indicates if the NVIDIA CUDNN library is available for ETL.
Definition: config.hpp:114
static constexpr size_t size()
Returns the size of the expression.
Definition: conv_4d_backward_expr.hpp:309
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: conv_4d_backward_expr.hpp:56
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271
static void apply(const I &input, const K &kernel, C &&conv)
Apply the convolution.
Definition: conv_4d.hpp:448
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: conv_4d_backward_expr.hpp:318
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297
Selector for the convolution implementations.
decltype(auto) smart_forward_gpu(E &expr)
Smart forwarding for a temporary expression that will be computed in GPU.
Definition: helpers.hpp:343
std::decay_t< A > left_expr_t
The left sub expression type.
Definition: conv_4d_backward_expr.hpp:235
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304
friend std::ostream & operator<<(std::ostream &os, const conv_4d_backward_expr &expr)
Print a representation of the expression on the given stream.
Definition: conv_4d_backward_expr.hpp:223
std::decay_t< B > right_expr_t
The right sub expression type.
Definition: conv_4d_backward_expr.hpp:236
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214
constexpr bool is_thread_safe
Traits to test if the given ETL expresion type is thread safe.
Definition: traits.hpp:687
value_t< A > value_type
The value type of the expression.
Definition: conv_4d_backward_expr.hpp:239
static void apply(const I &input, const K &kernel, C &&conv, size_t s1, size_t s2, size_t p1, size_t p2)
Apply the convolution.
Definition: conv_4d.hpp:352
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: conv_4d_backward_expr.hpp:195
void assign_to(C &&conv) const
Assign to a matrix.
Definition: conv_4d_backward_expr.hpp:95
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:577
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: conv_4d_backward_expr.hpp:186
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195
static size_t dim(const expr_t &e, size_t d)
Returns the dth dimension of the expression.
Definition: conv_4d_backward_expr.hpp:283