Expression Templates Library (ETL)
conv_1d_valid_expr.hpp
1 //=======================================================================
2 // Copyright (c) 2014-2023 Baptiste Wicht
3 // Distributed under the terms of the MIT License.
4 // (See accompanying file LICENSE or copy at
5 // http://opensource.org/licenses/MIT)
6 //=======================================================================
7 
8 #pragma once
9 
10 #include "etl/expr/base_temporary_expr.hpp"
11 
12 //Get the implementations
13 #include "etl/impl/conv.hpp"
14 #include "etl/impl/conv_select.hpp"
15 
16 namespace etl {
17 
22 template <etl_1d A, etl_1d B>
23 struct conv_1d_valid_expr : base_temporary_expr_bin<conv_1d_valid_expr<A, B>, A, B> {
28 
29  static constexpr auto storage_order = left_traits::storage_order;
30 
35  static constexpr bool gpu_computable = false;
36 
41  explicit conv_1d_valid_expr(A a, B b) : base_type(a, b) {
42  //Nothing else to init
43  }
44 
45  // Assignment functions
46 
50  template <etl_1d I, etl_1d K, etl_1d C>
51  static void check([[maybe_unused]] const I& input, [[maybe_unused]] const K& kernel, [[maybe_unused]] const C& conv) {
52  if constexpr (all_fast<A, B, C>) {
53  static_assert(etl::dim<0, C>() == etl::dim<0, I>() - etl::dim<0, K>() + 1, "Invalid dimensions for conv1_valid");
54  static_assert(etl::dim<0, I>() >= etl::dim<0, K>(), "Invalid dimensions for conv1_valid");
55  } else {
56  cpp_assert(etl::dim(conv, 0) == etl::dim(input, 0) - etl::dim(kernel, 0) + 1, "Invalid dimensions for conv1_valid");
57  cpp_assert(etl::dim(input, 0) >= etl::dim(kernel, 0), "Invalid dimensions for conv1_valid");
58  }
59  }
60 
65  template <etl_1d C>
66  void assign_to(C&& conv) const {
67  inc_counter("temp:assign");
68 
69  auto& input_raw = this->a();
70  auto& kernel_raw = this->b();
71 
72  check(input_raw, kernel_raw, conv);
73 
74  // Execute the correct implementation
75 
76  constexpr_select const auto impl = detail::select_conv1_impl_new<conv_type::VALID, A, B, C>();
77 
78  if constexpr_select (impl == etl::conv_impl::VEC) {
79  inc_counter("impl:vec");
80 
81  if constexpr (parallel_support) {
82  bool parallel_dispatch = detail::select_parallel(input_raw, kernel_raw, conv);
83 
84  if (parallel_dispatch) {
85  decltype(auto) input = make_temporary(input_raw);
86  decltype(auto) kernel = make_temporary(kernel_raw);
87 
88  engine_dispatch_1d([&](size_t first, size_t last) { impl::vec::conv1_valid(input, kernel, conv, first, last); },
89  0,
90  etl::size(conv),
91  parallel_dispatch);
92  } else {
93  impl::vec::conv1_valid(smart_forward(input_raw), smart_forward(kernel_raw), conv, 0, etl::size(conv));
94  }
95  } else {
96  impl::vec::conv1_valid(smart_forward(input_raw), smart_forward(kernel_raw), conv, 0, etl::size(conv));
97  }
98  } else if constexpr_select (impl == etl::conv_impl::STD) {
99  inc_counter("impl:std");
100 
101  if constexpr (parallel_support) {
102  bool parallel_dispatch = detail::select_parallel(input_raw, kernel_raw, conv);
103 
104  if (parallel_dispatch) {
105  decltype(auto) input = make_temporary(input_raw);
106  decltype(auto) kernel = make_temporary(kernel_raw);
107 
108  engine_dispatch_1d([&](size_t first, size_t last) { impl::standard::conv1_valid(input, kernel, conv, first, last); },
109  0,
110  etl::size(conv),
111  parallel_dispatch);
112  } else {
113  impl::standard::conv1_valid(smart_forward(input_raw), smart_forward(kernel_raw), conv, 0, etl::size(conv));
114  }
115  } else {
116  impl::standard::conv1_valid(smart_forward(input_raw), smart_forward(kernel_raw), conv, 0, etl::size(conv));
117  }
118  } else if constexpr_select (impl == etl::conv_impl::EGBLAS) {
119  inc_counter("impl:egblas");
120 
121  if constexpr (all_homogeneous<A, B, C>) {
122  decltype(auto) input = smart_forward_gpu(input_raw);
123  decltype(auto) kernel = smart_forward_gpu(kernel_raw);
124 
125  input.ensure_gpu_up_to_date();
126  kernel.ensure_gpu_up_to_date();
127 
128  conv.ensure_gpu_allocated();
129 
130  impl::egblas::conv1_valid(
131  etl::size(input_raw), etl::size(kernel_raw), value_type(1), input.gpu_memory(), 1, kernel.gpu_memory(), 1, conv.gpu_memory(), 1);
132 
133  conv.validate_gpu();
134  conv.invalidate_cpu();
135  } else {
136  cpp_unreachable("Invalid conv implementation selection");
137  }
138  } else {
139  cpp_unreachable("Invalid conv implementation selection");
140  }
141  }
142 
147  template <etl_1d L>
148  void assign_add_to(L&& lhs) const {
149  std_add_evaluate(*this, lhs);
150  }
151 
156  template <etl_1d L>
157  void assign_sub_to(L&& lhs) const {
158  std_sub_evaluate(*this, lhs);
159  }
160 
165  template <etl_1d L>
166  void assign_mul_to(L&& lhs) const {
167  std_mul_evaluate(*this, lhs);
168  }
169 
174  template <etl_1d L>
175  void assign_div_to(L&& lhs) const {
176  std_div_evaluate(*this, lhs);
177  }
178 
183  template <etl_1d L>
184  void assign_mod_to(L&& lhs) const {
185  std_mod_evaluate(*this, lhs);
186  }
187 
194  friend std::ostream& operator<<(std::ostream& os, const conv_1d_valid_expr& expr) {
195  return os << "conv1_valid(" << expr._a << ", " << expr._b << ")";
196  }
197 };
198 
203 template <etl_1d A, etl_1d B>
206  using left_expr_t = std::decay_t<A>;
207  using right_expr_t = std::decay_t<B>;
211 
212  static constexpr bool is_etl = true;
213  static constexpr bool is_transformer = false;
214  static constexpr bool is_view = false;
215  static constexpr bool is_magic_view = false;
216  static constexpr bool is_fast = all_fast<A, B>;
217  static constexpr bool is_linear = false;
218  static constexpr bool is_thread_safe = true;
219  static constexpr bool is_value = false;
220  static constexpr bool is_direct = true;
221  static constexpr bool is_generator = false;
222  static constexpr bool is_padded = false;
223  static constexpr bool is_aligned = true;
224  static constexpr bool is_temporary = true;
225  static constexpr bool gpu_computable = is_gpu_t<value_type> && cuda_enabled;
226  static constexpr order storage_order = left_traits::storage_order;
227 
233  template <vector_mode_t V>
234  static constexpr bool vectorizable = true;
235 
240  template <size_t DD>
241  static constexpr size_t dim() {
242  return etl::dim<0, A>() - etl::dim<0, B>() + 1;
243  }
244 
251  static size_t dim(const expr_t& e, [[maybe_unused]] size_t d) {
252  return etl::dim(e._a, 0) - etl::dim(e._b, 0) + 1;
253  }
254 
260  static size_t size(const expr_t& e) {
261  return etl::dim(e._a, 0) - etl::dim(e._b, 0) + 1;
262  }
263 
268  static constexpr size_t size() {
269  return etl::dim<0, A>() - etl::dim<0, B>() + 1;
270  }
271 
276  static constexpr size_t dimensions() {
277  return 1;
278  }
279 
284  static constexpr int complexity() noexcept {
285  return -1;
286  }
287 };
288 
295 template <etl_1d A, etl_1d B>
298 }
299 
307 template <etl_1d A, etl_1d B, etl_1d C>
308 auto conv_1d_valid(A&& a, B&& b, C&& c) {
309  c = conv_1d_valid(a, b);
310 
311  return c;
312 }
313 
314 } //end of namespace etl
static void check([[maybe_unused]] const I &input, [[maybe_unused]] const K &kernel, [[maybe_unused]] const C &conv)
Assert that the convolution is done on correct dimensions.
Definition: conv_1d_valid_expr.hpp:51
void engine_dispatch_1d(Functor &&functor, size_t first, size_t last, [[maybe_unused]] size_t threshold, [[maybe_unused]] size_t n_threads=etl::threads)
Dispatch the elements of a range to a functor in a parallel manner, using the global thread engine...
Definition: parallel_support.hpp:708
B _b
The sub expression reference.
Definition: base_temporary_expr.hpp:534
friend std::ostream & operator<<(std::ostream &os, const conv_1d_valid_expr &expr)
Print a representation of the expression on the given stream.
Definition: conv_1d_valid_expr.hpp:194
static constexpr auto storage_order
The sub storage order.
Definition: conv_1d_valid_expr.hpp:29
Standard implementation.
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311
A _a
The sub expression reference.
Definition: base_temporary_expr.hpp:533
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: conv_1d_valid_expr.hpp:284
conv_1d_valid_expr< detail::build_type< A >, detail::build_type< B > > conv_1d_valid(A &&a, B &&b)
Creates an expression representing the valid 1D convolution of a and b.
Definition: conv_1d_valid_expr.hpp:296
order
Storage order of a matrix.
Definition: order.hpp:15
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94
Abstract base class for temporary binary expression.
Definition: base_temporary_expr.hpp:529
VEC implementation.
static constexpr size_t size()
Returns the size of the expression.
Definition: conv_1d_valid_expr.hpp:268
std::add_lvalue_reference_t< B > b()
Returns the sub expression.
Definition: base_temporary_expr.hpp:593
constexpr bool is_fast
Traits to test if the given ETL expresion type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588
static constexpr size_t dim()
Returns the DDth dimension of the expression.
Definition: conv_1d_valid_expr.hpp:241
std::decay_t< A > left_expr_t
The left sub expression type.
Definition: conv_1d_valid_expr.hpp:206
Traits to get information about ETL types.
Definition: tmp.hpp:68
Root namespace for the ETL library.
Definition: adapter.hpp:15
A transposition expression.
Definition: conv_1d_valid_expr.hpp:23
GPU implementation.
auto dim(E &&value, size_t i) -> detail::identity_helper< E, dim_view< detail::build_identity_type< E >, D >>
Return a view representing the ith Dth dimension.
Definition: view_expression_builder.hpp:25
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: conv_1d_valid_expr.hpp:184
std::conditional_t< is_etl_value< T >, const std::decay_t< T > &, std::decay_t< T > > build_type
Helper to build the type for a sub expression.
Definition: expression_helpers.hpp:24
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: conv_1d_valid_expr.hpp:276
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: conv_1d_valid_expr.hpp:166
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: conv_1d_valid_expr.hpp:157
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271
value_t< A > value_type
The type of value of the expression.
Definition: conv_1d_valid_expr.hpp:24
void assign_to(C &&conv) const
Assign to a matrix of the same storage order.
Definition: conv_1d_valid_expr.hpp:66
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: conv_1d_valid_expr.hpp:148
Selector for the convolution implementations.
decltype(auto) smart_forward_gpu(E &expr)
Smart forwarding for a temporary expression that will be computed in GPU.
Definition: helpers.hpp:343
static size_t dim(const expr_t &e, [[maybe_unused]] size_t d)
Returns the dth dimension of the expression.
Definition: conv_1d_valid_expr.hpp:251
constexpr size_t size(const E &expr) noexcept
Returns the size of the given ETL expression.
Definition: helpers.hpp:108
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304
std::decay_t< B > right_expr_t
The right sub expression type.
Definition: conv_1d_valid_expr.hpp:207
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: conv_1d_valid_expr.hpp:35
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214
decltype(auto) smart_forward(E &expr)
Smart forwarding for a temporary expression.
Definition: helpers.hpp:323
constexpr bool parallel_support
Indicates if support for parallelization is integrated into the framework.
Definition: config.hpp:51
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: conv_1d_valid_expr.hpp:260
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: conv_1d_valid_expr.hpp:175
constexpr bool is_thread_safe
Traits to test if the given ETL expresion type is thread safe.
Definition: traits.hpp:687
conv_1d_valid_expr(A a, B b)
Construct a new expression.
Definition: conv_1d_valid_expr.hpp:41
Contains selectors for convolution implementations.
value_t< A > value_type
The value type of the expression.
Definition: conv_1d_valid_expr.hpp:210
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25
decltype(auto) make_temporary(E &&expr)
Make a temporary out of the expression if necessary.
Definition: temporary.hpp:173
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:577
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195