10 #include "etl/expr/base_temporary_expr.hpp" 22 template <
typename A,
typename B>
50 template <etl_1d I, etl_1d K, etl_1d C>
51 static void check([[maybe_unused]]
const I& input, [[maybe_unused]]
const K& kernel, [[maybe_unused]]
const C& conv) {
52 if constexpr (all_fast<A, B, C>) {
53 static_assert(etl::dim<0, C>() == etl::dim<0, I>() + etl::dim<0, K>() - 1,
"Invalid dimensions for conv1_full");
54 static_assert(etl::dim<0, I>() >= etl::dim<0, K>(),
"Invalid dimensions for conv1_full");
57 cpp_assert(
etl::dim(input, 0) >=
etl::dim(kernel, 0),
"Invalid dimensions for conv1_full");
69 auto& input_raw = this->
a();
70 auto& kernel_raw = this->
b();
72 check(input_raw, kernel_raw, conv);
76 constexpr_select
const auto impl = detail::select_conv1_impl_new<conv_type::FULL, A, B, C>();
82 bool parallel_dispatch = detail::select_parallel(input_raw, kernel_raw, conv);
84 if (parallel_dispatch) {
89 [&](
size_t first,
size_t last) { impl::vec::conv1_full(input, kernel, conv, first, last); }, 0,
etl::size(conv), parallel_dispatch);
100 bool parallel_dispatch = detail::select_parallel(input_raw, kernel_raw, conv);
102 if (parallel_dispatch) {
106 engine_dispatch_1d([&](
size_t first,
size_t last) { impl::standard::conv1_full(input, kernel, conv, first, last); },
126 if constexpr (all_homogeneous<A, B, C>) {
130 input.ensure_gpu_up_to_date();
131 kernel.ensure_gpu_up_to_date();
133 conv.ensure_gpu_allocated();
135 impl::egblas::conv1_full(
139 conv.invalidate_cpu();
141 cpp_unreachable(
"Invalid conv implementation selection");
144 cpp_unreachable(
"Invalid conv implementation selection");
152 template <
typename L>
161 template <
typename L>
170 template <
typename L>
179 template <
typename L>
188 template <
typename L>
200 return os <<
"conv1_full(" << expr.
_a <<
", " << expr.
_b <<
")";
208 template <
typename A,
typename B>
217 static constexpr
bool is_etl =
true;
221 static constexpr
bool is_fast = all_fast<A, B>;
222 static constexpr
bool is_linear =
false;
224 static constexpr
bool is_value =
false;
225 static constexpr
bool is_direct =
true;
226 static constexpr
bool is_generator =
false;
227 static constexpr
bool is_padded =
false;
228 static constexpr
bool is_aligned =
true;
229 static constexpr
bool is_temporary =
true;
238 template <vector_mode_t V>
239 static constexpr
bool vectorizable =
true;
246 static constexpr
size_t dim() {
247 return etl::dim<0, A>() + etl::dim<0, B>() - 1;
256 static size_t dim(
const expr_t& e, [[maybe_unused]]
size_t d) {
273 static constexpr
size_t size() {
274 return etl::dim<0, A>() + etl::dim<0, B>() - 1;
300 template <etl_expr A, etl_expr B>
312 template <etl_expr A, etl_expr B, etl_expr C>
A transposition expression.
Definition: conv_1d_full_expr.hpp:23
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: conv_1d_full_expr.hpp:265
FFT reduction (with MKL impl)
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:162
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:189
void engine_dispatch_1d(Functor &&functor, size_t first, size_t last, [[maybe_unused]] size_t threshold, [[maybe_unused]] size_t n_threads=etl::threads)
Dispatch the elements of a range to a functor in a parallel manner, using the global thread engine...
Definition: parallel_support.hpp:708
value_t< A > value_type
The type of value of the expression.
Definition: conv_1d_full_expr.hpp:24
B _b
The sub expression reference.
Definition: base_temporary_expr.hpp:534
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:171
static constexpr size_t dim()
Returns the DDth dimension of the expression.
Definition: conv_1d_full_expr.hpp:246
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311
A _a
The sub expression reference.
Definition: base_temporary_expr.hpp:533
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: conv_1d_full_expr.hpp:35
conv_1d_full_expr(A a, B b)
Construct a new expression.
Definition: conv_1d_full_expr.hpp:41
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:180
order
Storage order of a matrix.
Definition: order.hpp:15
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94
std::decay_t< B > right_expr_t
The right sub expression type.
Definition: conv_1d_full_expr.hpp:212
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: conv_1d_full_expr.hpp:289
Abstract base class for temporary binary expression.
Definition: base_temporary_expr.hpp:529
static void check([[maybe_unused]] const I &input, [[maybe_unused]] const K &kernel, [[maybe_unused]] const C &conv)
Assert that the convolution is done on correct dimensions.
Definition: conv_1d_full_expr.hpp:51
static size_t dim(const expr_t &e, [[maybe_unused]] size_t d)
Returns the dth dimension of the expression.
Definition: conv_1d_full_expr.hpp:256
std::add_lvalue_reference_t< B > b()
Returns the sub expression.
Definition: base_temporary_expr.hpp:593
constexpr bool is_fast
Traits to test if the given ETL expresion type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588
friend std::ostream & operator<<(std::ostream &os, const conv_1d_full_expr &expr)
Print a representation of the expression on the given stream.
Definition: conv_1d_full_expr.hpp:199
Traits to get information about ETL types.
Definition: tmp.hpp:68
Root namespace for the ETL library.
Definition: adapter.hpp:15
FFT reduction (with STD impl)
auto dim(E &&value, size_t i) -> detail::identity_helper< E, dim_view< detail::build_identity_type< E >, D >>
Return a view representing the ith Dth dimension.
Definition: view_expression_builder.hpp:25
std::conditional_t< is_etl_value< T >, const std::decay_t< T > &, std::decay_t< T > > build_type
Helper to build the type for a sub expression.
Definition: expression_helpers.hpp:24
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271
value_t< A > value_type
The value type of the expression.
Definition: conv_1d_full_expr.hpp:215
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297
static constexpr size_t size()
Returns the size of the expression.
Definition: conv_1d_full_expr.hpp:273
Selector for the convolution implementations.
decltype(auto) smart_forward_gpu(E &expr)
Smart forwarding for a temporary expression that will be computed in GPU.
Definition: helpers.hpp:343
constexpr size_t size(const E &expr) noexcept
Returns the size of the given ETL expression.
Definition: helpers.hpp:108
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214
decltype(auto) smart_forward(E &expr)
Smart forwarding for a temporary expression.
Definition: helpers.hpp:323
void assign_to(C &&conv) const
Assign to a matrix of the same storage order.
Definition: conv_1d_full_expr.hpp:66
constexpr bool parallel_support
Indicates if support for parallelization is integrated into the framework.
Definition: config.hpp:51
constexpr bool is_thread_safe
Traits to test if the given ETL expresion type is thread safe.
Definition: traits.hpp:687
conv_1d_full_expr< detail::build_type< A >, detail::build_type< B > > conv_1d_full(A &&a, B &&b)
Creates an expression representing the valid 1D convolution of a and b.
Definition: conv_1d_full_expr.hpp:301
static constexpr auto storage_order
The sub storage order.
Definition: conv_1d_full_expr.hpp:29
Contains selectors for convolution implementations.
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:153
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:577
std::decay_t< A > left_expr_t
The left sub expression type.
Definition: conv_1d_full_expr.hpp:211
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: conv_1d_full_expr.hpp:281
FFT reduction (with CUFFT impl)