Expression Templates Library (ETL)
dyn_conv_2d_valid_multi_expr.hpp
1 //=======================================================================
2 // Copyright (c) 2014-2023 Baptiste Wicht
3 // Distributed under the terms of the MIT License.
4 // (See accompanying file LICENSE or copy at
5 // http://opensource.org/licenses/MIT)
6 //=======================================================================
7 
8 #pragma once
9 
10 #include "etl/expr/base_temporary_expr.hpp"
11 
12 //Get the implementations
13 #include "etl/impl/conv.hpp"
14 
15 namespace etl {
16 
/*!
 * \brief Expression for the 'valid' convolution of several kernels with one
 * input image, with the strides and paddings supplied at run time through the
 * constructor.
 *
 * \tparam A The left sub expression type (constrained by etl_2d)
 * \tparam B The right sub expression type (constrained by etl_3d)
 * \tparam Flipped Compile-time switch tested by assign_to() to select the branch to run
 *
 * NOTE(review): base_type and left_traits are used below, but their
 * declarations are not visible in this listing (the embedded numbering jumps
 * from 26 to 31) -- confirm against the upstream header.
 */
25 template <etl_2d A, etl_3d B, bool Flipped>
26 struct dyn_conv_2d_valid_multi_expr : base_temporary_expr_bin<dyn_conv_2d_valid_multi_expr<A, B, Flipped>, A, B> {
31 
    /*! \brief The sub storage order, read from left_traits */
32  static constexpr auto storage_order = left_traits::storage_order;
33 
    /*!
     * \brief Indicates if the temporary expression can be directly evaluated
     * using only GPU.
     *
     * True only when cudnn_enabled is set and impl::cudnn::conv_possible_<A, B> holds.
     */
38  static constexpr bool gpu_computable = cudnn_enabled && impl::cudnn::conv_possible_<A, B>;
39 
    /*! \brief The stride of the first dimension */
40  const size_t s1;
    /*! \brief The stride of the second dimension */
41  const size_t s2;
    /*! \brief The padding of the first dimension */
42  const size_t p1;
    /*! \brief The padding of the second dimension */
43  const size_t p2;
44 
    /*!
     * \brief Construct a new expression.
     * \param a The left sub expression (handed to base_type)
     * \param b The right sub expression (handed to base_type)
     * \param s1 The stride of the first dimension
     * \param s2 The stride of the second dimension
     * \param p1 The padding of the first dimension
     * \param p2 The padding of the second dimension
     */
49  explicit dyn_conv_2d_valid_multi_expr(A a, B b, size_t s1, size_t s2, size_t p1, size_t p2) : base_type(a, b), s1(s1), s2(s2), p1(p1), p2(p2) {
50  //Nothing else to init
51  }
52 
53  // Assignment functions
54 
    /*!
     * \brief Assert that the convolution is done on correct dimensions.
     *
     * The three assertions require that:
     *  - dimension 0 of conv equals dimension 0 of kernel;
     *  - dimension 1 of conv equals (dim(input, 0) - dim(kernel, 1) + 2 * p1) / s1 + 1;
     *  - dimension 2 of conv equals (dim(input, 1) - dim(kernel, 2) + 2 * p2) / s2 + 1.
     *
     * \param input The 2D input expression
     * \param kernel The 3D kernel expression
     * \param conv The 3D output expression
     *
     * NOTE(review): the parameters are [[maybe_unused]], presumably because
     * cpp_assert can compile to nothing in some builds -- confirm.
     */
58  template <etl_2d I, etl_3d K, etl_3d C>
59  void check([[maybe_unused]] const I& input, [[maybe_unused]] const K& kernel, [[maybe_unused]] const C& conv) const {
60  cpp_assert(etl::dim(conv, 0) == etl::dim(kernel, 0), "Invalid dimensions for conv_2d_valid_multi");
61  cpp_assert(etl::dim(conv, 1) == (etl::dim(input, 0) - etl::dim(kernel, 1) + 2 * p1) / s1 + 1, "Invalid dimensions for conv_2d_valid_multi");
62  cpp_assert(etl::dim(conv, 2) == (etl::dim(input, 1) - etl::dim(kernel, 2) + 2 * p2) / s2 + 1, "Invalid dimensions for conv_2d_valid_multi");
63  }
64 
    /*!
     * \brief Assign to a matrix of the full storage order.
     *
     * Increases the "temp:assign" counter, checks the dimensions of the two sub
     * expressions against c, then runs the branch selected by Flipped.
     *
     * \param c The expression to which the result is assigned
     */
69  template <etl_expr C>
70  void assign_to(C&& c) const {
71  inc_counter("temp:assign");
72 
73  auto& a = this->a();
74  auto& b = this->b();
75 
76  check(a, b, c);
77 
    // NOTE(review): the Flipped branch is empty in this listing (the embedded
    // numbering jumps from 78 to 80), so as written nothing is computed when
    // Flipped is true. The call to the flipped implementation presumably
    // belongs here -- confirm against the upstream header.
78  if constexpr (Flipped) {
80  } else {
81  detail::dyn_conv2_valid_multi_impl::apply(a, b, c, s1, s2, p1, p2);
82  }
83  }
84 
    /*!
     * \brief Add to the given left-hand-side expression.
     * \param lhs The expression handed to std_add_evaluate as the result
     */
89  template <typename L>
90  void assign_add_to(L&& lhs) const {
91  std_add_evaluate(*this, lhs);
92  }
93 
    /*!
     * \brief Sub from the given left-hand-side expression.
     * \param lhs The expression handed to std_sub_evaluate as the result
     */
98  template <typename L>
99  void assign_sub_to(L&& lhs) const {
100  std_sub_evaluate(*this, lhs);
101  }
102 
    /*!
     * \brief Multiply the given left-hand-side expression.
     * \param lhs The expression handed to std_mul_evaluate as the result
     */
107  template <typename L>
108  void assign_mul_to(L&& lhs) const {
109  std_mul_evaluate(*this, lhs);
110  }
111 
    /*!
     * \brief Divide the given left-hand-side expression.
     * \param lhs The expression handed to std_div_evaluate as the result
     */
116  template <typename L>
117  void assign_div_to(L&& lhs) const {
118  std_div_evaluate(*this, lhs);
119  }
120 
    /*!
     * \brief Modulo the given left-hand-side expression.
     * \param lhs The expression handed to std_mod_evaluate as the result
     */
125  template <typename L>
126  void assign_mod_to(L&& lhs) const {
127  std_mod_evaluate(*this, lhs);
128  }
129 
    /*!
     * \brief Print a representation of the expression on the given stream.
     *
     * The output is "conv2_valid_multi(" followed by the two sub expressions
     * separated by ", " and a closing ")". The strides, the paddings and the
     * Flipped flag are not printed.
     *
     * \param os The output stream
     * \param expr The expression to print
     * \return the output stream
     */
136  friend std::ostream& operator<<(std::ostream& os, const dyn_conv_2d_valid_multi_expr& expr) {
137  return os << "conv2_valid_multi(" << expr._a << ", " << expr._b << ")";
138  }
139 };
140 
/*!
 * \brief Traits specialization for dyn_conv_2d_valid_multi_expr.
 *
 * \tparam A The left sub expression type
 * \tparam B The right sub expression type
 * \tparam Flipped The Flipped flag of the described expression
 *
 * NOTE(review): expr_t, value_type and left_traits are used below, but their
 * declarations are not visible in this listing (embedded lines 147 and
 * 150-152 are missing) -- confirm against the upstream header.
 */
145 template <typename A, typename B, bool Flipped>
146 struct etl_traits<etl::dyn_conv_2d_valid_multi_expr<A, B, Flipped>> {
    /*! \brief The left sub expression type */
148  using left_expr_t = std::decay_t<A>;
    /*! \brief The right sub expression type */
149  using right_expr_t = std::decay_t<B>;
153 
    // Compile-time property flags of the expression.
154  static constexpr bool is_etl = true;
    // Not a transformer expression.
155  static constexpr bool is_transformer = false;
    // Not a view expression.
156  static constexpr bool is_view = false;
    // Not a magic view expression.
157  static constexpr bool is_magic_view = false;
    // Not fast: the sizes are not known at compile time (dim() computes them from run-time values).
158  static constexpr bool is_fast = false;
159  static constexpr bool is_linear = false;
160  static constexpr bool is_thread_safe = true;
161  static constexpr bool is_value = false;
162  static constexpr bool is_direct = true;
163  static constexpr bool is_generator = false;
164  static constexpr bool is_padded = false;
165  static constexpr bool is_aligned = true;
166  static constexpr bool is_temporary = true;
    // Requires both a value type accepted by is_gpu_t and cuda_enabled.
167  static constexpr bool gpu_computable = is_gpu_t<value_type> && cuda_enabled;
    // Same storage order as the left sub expression.
168  static constexpr order storage_order = left_traits::storage_order;
169 
    /*!
     * \brief Vectorization flag; true for every vector mode V.
     * \tparam V The vector mode
     */
175  template <vector_mode_t V>
176  static constexpr bool vectorizable = true;
177 
    /*!
     * \brief Returns the dth dimension of the expression.
     *
     * Dimension 0 is dimension 0 of the right sub expression. Dimension 1 is
     * (dim(a, 0) - dim(b, 1) + 2 * p1) / s1 + 1. Any other d yields
     * (dim(a, 1) - dim(b, 2) + 2 * p2) / s2 + 1.
     *
     * \param e The expression
     * \param d The dimension to get
     * \return the dth dimension of the expression
     *
     * NOTE(review): the computation is done on size_t with integer division,
     * and nothing here guards against a stride of zero.
     */
184  static size_t dim(const expr_t& e, size_t d) {
185  if (d == 0) {
186  return etl::dim(e._b, 0);
187  } else if (d == 1) {
188  return (etl::dim(e._a, 0) - etl::dim(e._b, 1) + 2 * e.p1) / e.s1 + 1;
189  } else {
190  return (etl::dim(e._a, 1) - etl::dim(e._b, 2) + 2 * e.p2) / e.s2 + 1;
191  }
192  }
193 
    /*!
     * \brief Returns the size of the expression.
     *
     * The result is the product of the three values that dim() yields for
     * d = 0, 1 and 2; the formulas are repeated here rather than calling dim().
     *
     * \param e The expression
     * \return the size of the expression
     */
199  static size_t size(const expr_t& e) {
200  return (etl::dim(e._b, 0)) * ((etl::dim(e._a, 0) - etl::dim(e._b, 1) + 2 * e.p1) / e.s1 + 1)
201  * ((etl::dim(e._a, 1) - etl::dim(e._b, 2) + 2 * e.p2) / e.s2 + 1);
202  }
203 
    /*!
     * \brief Returns the number of dimensions of the expression.
     * \return always 3
     */
208  static constexpr size_t dimensions() {
209  return 3;
210  }
211 
    /*!
     * \brief Estimate the complexity of computation.
     * \return always -1
     *
     * NOTE(review): the meaning of -1 is not visible in this listing;
     * presumably a sentinel for "no estimate" -- confirm.
     */
216  static constexpr int complexity() noexcept {
217  return -1;
218  }
219 };
220 
/*!
 * \brief Builds a dyn_conv_2d_valid_multi_expr of a and b with the Flipped
 * flag set to false.
 *
 * Nothing is computed here; the expression object is only constructed.
 *
 * \param a The left sub expression
 * \param b The right sub expression
 * \param s1 The stride of the first dimension
 * \param s2 The stride of the second dimension
 * \param p1 The padding of the first dimension (defaults to 0)
 * \param p2 The padding of the second dimension (defaults to 0)
 * \return the newly built expression
 *
 * NOTE(review): the line holding the return type and the function name
 * (embedded line 232) is missing from this listing. The name is presumably
 * conv_2d_valid_multi, since the overload taking an output expression calls
 * conv_2d_valid_multi(a, b, s1, s2, p1, p2) -- confirm against upstream.
 */
231 template <etl_expr A, etl_expr B>
233  A&& a, B&& b, size_t s1, size_t s2, size_t p1 = 0, size_t p2 = 0) {
234  return dyn_conv_2d_valid_multi_expr<detail::build_type<A>, detail::build_type<B>, false>{a, b, s1, s2, p1, p2};
235 }
236 
/*!
 * \brief Assigns the result of conv_2d_valid_multi(a, b, s1, s2, p1, p2) to c
 * and returns c.
 *
 * Unlike the overload without an output expression, p1 and p2 have no default
 * value here.
 *
 * \param a The left sub expression
 * \param b The right sub expression
 * \param c The expression receiving the result
 * \param s1 The stride of the first dimension
 * \param s2 The stride of the second dimension
 * \param p1 The padding of the first dimension
 * \param p2 The padding of the second dimension
 * \return c
 *
 * NOTE(review): the return type is plain auto, so c is returned by value, not
 * by reference.
 */
248 template <etl_expr A, etl_expr B, etl_expr C>
249 auto conv_2d_valid_multi(A&& a, B&& b, C&& c, size_t s1, size_t s2, size_t p1, size_t p2) {
250  c = conv_2d_valid_multi(a, b, s1, s2, p1, p2);
251 
252  return c;
253 }
254 
/*!
 * \brief Builds a dyn_conv_2d_valid_multi_expr of a and b with the Flipped
 * flag set to true.
 *
 * Nothing is computed here; the expression object is only constructed.
 *
 * \param a The left sub expression
 * \param b The right sub expression
 * \param s1 The stride of the first dimension
 * \param s2 The stride of the second dimension
 * \param p1 The padding of the first dimension (defaults to 0)
 * \param p2 The padding of the second dimension (defaults to 0)
 * \return the newly built expression
 *
 * NOTE(review): the line holding the return type and the function name
 * (embedded line 266) is missing from this listing. The name is presumably
 * conv_2d_valid_multi_flipped, since the overload taking an output expression
 * calls conv_2d_valid_multi_flipped(a, b, s1, s2, p1, p2) -- confirm against
 * upstream.
 */
265 template <etl_expr A, etl_expr B>
267  A&& a, B&& b, size_t s1, size_t s2, size_t p1 = 0, size_t p2 = 0) {
268  return dyn_conv_2d_valid_multi_expr<detail::build_type<A>, detail::build_type<B>, true>{a, b, s1, s2, p1, p2};
269 }
270 
/*!
 * \brief Assigns the result of conv_2d_valid_multi_flipped(a, b, s1, s2, p1, p2)
 * to c and returns c.
 *
 * Unlike the overload without an output expression, p1 and p2 have no default
 * value here.
 *
 * \param a The left sub expression
 * \param b The right sub expression
 * \param c The expression receiving the result
 * \param s1 The stride of the first dimension
 * \param s2 The stride of the second dimension
 * \param p1 The padding of the first dimension
 * \param p2 The padding of the second dimension
 * \return c
 *
 * NOTE(review): the return type is plain auto, so c is returned by value, not
 * by reference.
 */
282 template <etl_expr A, etl_expr B, etl_expr C>
283 auto conv_2d_valid_multi_flipped(A&& a, B&& b, C&& c, size_t s1, size_t s2, size_t p1, size_t p2) {
284  c = conv_2d_valid_multi_flipped(a, b, s1, s2, p1, p2);
285 
286  return c;
287 }
288 
289 } //end of namespace etl
dyn_conv_2d_valid_multi_expr(A a, B b, size_t s1, size_t s2, size_t p1, size_t p2)
Construct a new expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:49
static constexpr auto storage_order
The sub storage order.
Definition: dyn_conv_2d_valid_multi_expr.hpp:32
conv_2d_valid_multi_expr< detail::build_type< A >, detail::build_type< B >, S1, S2, P1, P2, true > conv_2d_valid_multi_flipped(A &&a, B &&b)
Creates an expression representing the 'valid' 2D convolution of a and flipped b. ...
Definition: conv_2d_valid_multi_expr.hpp:274
B _b
The sub expression reference.
Definition: base_temporary_expr.hpp:534
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:199
conv_2d_valid_multi_expr< detail::build_type< A >, detail::build_type< B >, S1, S2, P1, P2, false > conv_2d_valid_multi(A &&a, B &&b)
Creates an expression representing the 'valid' 2D convolution of a and b.
Definition: conv_2d_valid_multi_expr.hpp:245
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311
A _a
The sub expression reference.
Definition: base_temporary_expr.hpp:533
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:117
void assign_to(C &&c) const
Assign to a matrix of the full storage order.
Definition: dyn_conv_2d_valid_multi_expr.hpp:70
static void apply(I &&input, K &&kernel, C &&conv, size_t s1, size_t s2, size_t p1, size_t p2)
Apply the convolution.
Definition: conv_multi.hpp:272
static size_t dim(const expr_t &e, size_t d)
Returns the dth dimension of the expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:184
order
Storage order of a matrix.
Definition: order.hpp:15
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:208
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94
Abstract base class for temporary binary expression.
Definition: base_temporary_expr.hpp:529
value_t< A > value_type
The type of value of the expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:27
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: dyn_conv_2d_valid_multi_expr.hpp:216
std::add_lvalue_reference_t< B > b()
Returns the sub expression.
Definition: base_temporary_expr.hpp:593
friend std::ostream & operator<<(std::ostream &os, const dyn_conv_2d_valid_multi_expr &expr)
Print a representation of the expression on the given stream.
Definition: dyn_conv_2d_valid_multi_expr.hpp:136
void check([[maybe_unused]] const I &input, [[maybe_unused]] const K &kernel, [[maybe_unused]] const C &conv) const
Assert that the convolution is done on correct dimensions.
Definition: dyn_conv_2d_valid_multi_expr.hpp:59
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:99
constexpr bool is_fast
Traits to test if the given ETL expression type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588
const size_t p2
The padding of the second dimension.
Definition: dyn_conv_2d_valid_multi_expr.hpp:43
Traits to get information about ETL types.
Definition: tmp.hpp:68
Root namespace for the ETL library.
Definition: adapter.hpp:15
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:90
value_t< A > value_type
The value type of the expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:152
auto dim(E &&value, size_t i) -> detail::identity_helper< E, dim_view< detail::build_identity_type< E >, D >>
Return a view representing the ith Dth dimension.
Definition: view_expression_builder.hpp:25
std::conditional_t< is_etl_value< T >, const std::decay_t< T > &, std::decay_t< T > > build_type
Helper to build the type for a sub expression.
Definition: expression_helpers.hpp:24
const size_t p1
The padding of the first dimension.
Definition: dyn_conv_2d_valid_multi_expr.hpp:42
constexpr bool cudnn_enabled
Indicates if the NVIDIA CUDNN library is available for ETL.
Definition: config.hpp:114
Expression for the 'valid' convolution of several kernels with one input image.
Definition: dyn_conv_2d_valid_multi_expr.hpp:26
const size_t s2
The stride of the second dimension.
Definition: dyn_conv_2d_valid_multi_expr.hpp:41
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:108
static void apply(I &&input, K &&kernel, C &&conv, size_t s1, size_t s2, size_t p1, size_t p2)
Apply the convolution.
Definition: conv_multi.hpp:222
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297
Selector for the convolution implementations.
const size_t s1
The stride of the first dimension.
Definition: dyn_conv_2d_valid_multi_expr.hpp:40
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304
std::decay_t< B > right_expr_t
The right sub expression type.
Definition: dyn_conv_2d_valid_multi_expr.hpp:149
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: dyn_conv_2d_valid_multi_expr.hpp:126
std::decay_t< A > left_expr_t
The left sub expression type.
Definition: dyn_conv_2d_valid_multi_expr.hpp:148
constexpr bool is_thread_safe
Traits to test if the given ETL expression type is thread safe.
Definition: traits.hpp:687
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: dyn_conv_2d_valid_multi_expr.hpp:38
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:577
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195