Expression Templates Library (ETL)
conv_4d_full_expr.hpp
1 //=======================================================================
2 // Copyright (c) 2014-2023 Baptiste Wicht
3 // Distributed under the terms of the MIT License.
4 // (See accompanying file LICENSE or copy at
5 // http://opensource.org/licenses/MIT)
6 //=======================================================================
7 
8 #pragma once
9 
10 #include "etl/expr/base_temporary_expr.hpp"
11 
12 //Get the implementations
13 #include "etl/impl/conv.hpp"
14 
15 namespace etl {
16 
21 template <etl_4d A, etl_4d B, bool Flipped>
22 struct conv_4d_full_expr : base_temporary_expr_bin<conv_4d_full_expr<A, B, Flipped>, A, B> {
27 
28  static constexpr auto storage_order = left_traits::storage_order;
29 
34  static constexpr bool gpu_computable = cudnn_enabled && impl::cudnn::conv_possible_<A, B>;
35 
40  explicit conv_4d_full_expr(A a, B b) : base_type(a, b) {
41  //Nothing else to init
42  }
43 
44  // Assignment functions
45 
49  template <etl_4d I, etl_4d K, etl_4d C>
50  static void check([[maybe_unused]] const I& input, [[maybe_unused]] const K& kernel, [[maybe_unused]] const C& conv) {
51  if constexpr (all_fast<A, B, C>) {
52  static_assert(etl::dim<0, C>() == etl::dim<0, I>(), "Invalid dimensions for conv4_full");
53  static_assert(etl::dim<1, C>() == etl::dim<1, K>(), "Invalid dimensions for conv4_full");
54  static_assert(etl::dim<1, I>() == etl::dim<0, K>(), "Invalid dimensions for conv4_full");
55 
56  static_assert(etl::dim<2, C>() == etl::dim<2, I>() + etl::dim<2, K>() - 1, "Invalid dimensions for conv4_full");
57  static_assert(etl::dim<3, C>() == etl::dim<3, I>() + etl::dim<3, K>() - 1, "Invalid dimensions for conv4_full");
58  } else {
59  cpp_assert(etl::dim(conv, 0) == etl::dim(input, 0), "Invalid dimensions for conv4_full");
60  cpp_assert(etl::dim(conv, 1) == etl::dim(kernel, 1), "Invalid dimensions for conv4_full");
61  cpp_assert(etl::dim(input, 1) == etl::dim(kernel, 0), "Invalid dimensions for conv4_full");
62 
63  cpp_assert(etl::dim(conv, 2) == etl::dim(input, 2) + etl::dim(kernel, 2) - 1, "Invalid dimensions for conv4_full");
64  cpp_assert(etl::dim(conv, 3) == etl::dim(input, 3) + etl::dim(kernel, 3) - 1, "Invalid dimensions for conv4_full");
65  }
66  }
67 
72  template <etl_4d C>
73  void assign_to(C&& c) const {
74  inc_counter("temp:assign");
75 
76  auto& a = this->a();
77  auto& b = this->b();
78 
79  check(a, b, c);
80 
81  if constexpr (Flipped) {
83  } else {
85  }
86  }
87 
92  template <etl_4d L>
93  void assign_add_to(L&& lhs) const {
94  std_add_evaluate(*this, lhs);
95  }
96 
101  template <etl_4d L>
102  void assign_sub_to(L&& lhs) const {
103  std_sub_evaluate(*this, lhs);
104  }
105 
110  template <etl_4d L>
111  void assign_mul_to(L&& lhs) const {
112  std_mul_evaluate(*this, lhs);
113  }
114 
119  template <etl_4d L>
120  void assign_div_to(L&& lhs) const {
121  std_div_evaluate(*this, lhs);
122  }
123 
128  template <etl_4d L>
129  void assign_mod_to(L&& lhs) const {
130  std_mod_evaluate(*this, lhs);
131  }
132 
139  friend std::ostream& operator<<(std::ostream& os, const conv_4d_full_expr& expr) {
140  return os << "conv4_full(" << expr._a << ", " << expr._b << ")";
141  }
142 };
143 
148 template <etl_4d A, etl_4d B, bool Flipped>
149 struct etl_traits<etl::conv_4d_full_expr<A, B, Flipped>> {
151  using left_expr_t = std::decay_t<A>;
152  using right_expr_t = std::decay_t<B>;
156 
157  static constexpr bool is_etl = true;
158  static constexpr bool is_transformer = false;
159  static constexpr bool is_view = false;
160  static constexpr bool is_magic_view = false;
161  static constexpr bool is_fast = all_fast<A, B>;
162  static constexpr bool is_linear = false;
163  static constexpr bool is_thread_safe = true;
164  static constexpr bool is_value = false;
165  static constexpr bool is_direct = true;
166  static constexpr bool is_generator = false;
167  static constexpr bool is_padded = false;
168  static constexpr bool is_aligned = true;
169  static constexpr bool is_temporary = true;
170  static constexpr bool gpu_computable = is_gpu_t<value_type> && cuda_enabled;
171  static constexpr order storage_order = left_traits::storage_order;
172 
178  template <vector_mode_t V>
179  static constexpr bool vectorizable = true;
180 
185  template <size_t DD>
186  static constexpr size_t dim() {
187  return DD == 0 ? etl::dim<DD, A>() : DD == 1 ? etl::dim<DD, B>() : etl::dim<DD, A>() + etl::dim<DD, B>() - 1;
188  }
189 
196  static size_t dim(const expr_t& e, size_t d) {
197  if (d == 0) {
198  return etl::dim(e._a, 0);
199  } else if (d == 1) {
200  return etl::dim(e._b, 1);
201  } else {
202  return etl::dim(e._a, d) + etl::dim(e._b, d) - 1;
203  }
204  }
205 
211  static size_t size(const expr_t& e) {
212  return etl::dim(e._a, 0) * etl::dim(e._b, 1) * (etl::dim(e._a, 2) + etl::dim(e._b, 2) - 1) * (etl::dim(e._a, 3) + etl::dim(e._b, 3) - 1);
213  }
214 
219  static constexpr size_t size() {
220  return etl::dim<0, A>() * etl::dim<1, B>() * (etl::dim<2, A>() + etl::dim<2, B>() - 1) * (etl::dim<3, A>() + etl::dim<3, B>() - 1);
221  }
222 
227  static constexpr size_t dimensions() {
228  return 4;
229  }
230 
235  static constexpr int complexity() noexcept {
236  return -1;
237  }
238 };
239 
251 template <etl_4d A, etl_4d B>
253  return conv_4d_full_expr<detail::build_type<A>, detail::build_type<B>, false>{a, b};
254 }
255 
268 template <etl_4d A, etl_4d B, etl_4d C>
269 auto conv_4d_full(A&& a, B&& b, C&& c) {
270  c = conv_4d_full(a, b);
271 
272  return c;
273 }
274 
286 template <etl_4d A, etl_4d B>
287 conv_4d_full_expr<detail::build_type<A>, detail::build_type<B>, true> conv_4d_full_flipped(A&& a, B&& b) {
288  return conv_4d_full_expr<detail::build_type<A>, detail::build_type<B>, true>{a, b};
289 }
290 
303 template <etl_4d A, etl_4d B, etl_4d C>
304 auto conv_4d_full_flipped(A&& a, B&& b, C&& c) {
305  c = conv_4d_full_flipped(a, b);
306 
307  return c;
308 }
309 
310 } //end of namespace etl
static constexpr size_t dim()
Returns the DDth dimension of the expression.
Definition: conv_4d_full_expr.hpp:186
static size_t dim(const expr_t &e, size_t d)
Returns the dth dimension of the expression.
Definition: conv_4d_full_expr.hpp:196
B _b
The sub expression reference.
Definition: base_temporary_expr.hpp:534
std::decay_t< B > right_expr_t
The right sub expression type.
Definition: conv_4d_full_expr.hpp:152
static void check([[maybe_unused]] const I &input, [[maybe_unused]] const K &kernel, [[maybe_unused]] const C &conv)
Assert that the convolution is done on correct dimensions.
Definition: conv_4d_full_expr.hpp:50
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311
A _a
The sub expression reference.
Definition: base_temporary_expr.hpp:533
static void apply(const I &input, const K &kernel, C &&conv)
Apply the convolution.
Definition: conv_4d.hpp:408
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: conv_4d_full_expr.hpp:227
static constexpr auto storage_order
The sub storage order.
Definition: conv_4d_full_expr.hpp:28
void assign_to(C &&c) const
Assign to a matrix of the full storage order.
Definition: conv_4d_full_expr.hpp:73
order
Storage order of a matrix.
Definition: order.hpp:15
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: conv_4d_full_expr.hpp:34
conv_4d_full_expr(A a, B b)
Construct a new expression.
Definition: conv_4d_full_expr.hpp:40
Abstract base class for temporary binary expression.
Definition: base_temporary_expr.hpp:529
friend std::ostream & operator<<(std::ostream &os, const conv_4d_full_expr &expr)
Print a representation of the expression on the given stream.
Definition: conv_4d_full_expr.hpp:139
std::add_lvalue_reference_t< B > b()
Returns the sub expression.
Definition: base_temporary_expr.hpp:593
constexpr bool is_fast
Traits to test if the given ETL expression type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588
conv_4d_full_expr< detail::build_type< A >, detail::build_type< B >, false > conv_4d_full(A &&a, B &&b)
Creates an expression representing the 'full' 4D convolution of a and b.
Definition: conv_4d_full_expr.hpp:252
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: conv_4d_full_expr.hpp:120
Traits to get information about ETL types.
Definition: tmp.hpp:68
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: conv_4d_full_expr.hpp:102
Root namespace for the ETL library.
Definition: adapter.hpp:15
auto dim(E &&value, size_t i) -> detail::identity_helper< E, dim_view< detail::build_identity_type< E >, D >>
Return a view representing the ith Dth dimension.
Definition: view_expression_builder.hpp:25
value_t< A > value_type
The type of value of the expression.
Definition: conv_4d_full_expr.hpp:23
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: conv_4d_full_expr.hpp:211
std::conditional_t< is_etl_value< T >, const std::decay_t< T > &, std::decay_t< T > > build_type
Helper to build the type for a sub expression.
Definition: expression_helpers.hpp:24
constexpr bool cudnn_enabled
Indicates if the NVIDIA CUDNN library is available for ETL.
Definition: config.hpp:114
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: conv_4d_full_expr.hpp:93
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: conv_4d_full_expr.hpp:129
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271
static void apply(const I &input, const K &kernel, C &&conv)
Apply the convolution.
Definition: conv_4d.hpp:448
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: conv_4d_full_expr.hpp:235
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297
Selector for the convolution implementations.
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304
std::decay_t< A > left_expr_t
The left sub expression type.
Definition: conv_4d_full_expr.hpp:151
static constexpr size_t size()
Returns the size of the expression.
Definition: conv_4d_full_expr.hpp:219
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214
constexpr bool is_thread_safe
Traits to test if the given ETL expression type is thread safe.
Definition: traits.hpp:687
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: conv_4d_full_expr.hpp:111
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25
conv_4d_full_expr< detail::build_type< A >, detail::build_type< B >, true > conv_4d_full_flipped(A &&a, B &&b)
Creates an expression representing the 'full' 4D convolution of a and flipped b.
Definition: conv_4d_full_expr.hpp:287
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:577
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195
A 'full' 4D convolution expression.
Definition: conv_4d_full_expr.hpp:22
value_t< A > value_type
The value type of the expression.
Definition: conv_4d_full_expr.hpp:155