wichtounet/etl/conv__1d__full__expr_8hpp_source.html

 //=======================================================================
 // Copyright (c) 2014-2023 Baptiste Wicht
 // Distributed under the terms of the MIT License.
 // (See accompanying file LICENSE or copy at
 //  http://opensource.org/licenses/MIT)
 //=======================================================================

 #pragma once

 #include "etl/expr/base_temporary_expr.hpp"

 //Get the implementations
 #include "etl/impl/conv_select.hpp"
 #include "etl/impl/conv.hpp"

 namespace etl {

 /*!
  * \brief Temporary expression for the 'full' 1D convolution of an input and a kernel.
  *
  * The destination must have dim(input) + dim(kernel) - 1 elements, as
  * enforced by check().
  *
  * \tparam A The type of the input (left) sub expression
  * \tparam B The type of the kernel (right) sub expression
  */
 template <typename A, typename B>
 struct conv_1d_full_expr : base_temporary_expr_bin<conv_1d_full_expr<A, B>, A, B> {
     using value_type  = value_t<A>;                               ///< The type of value of the expression
     using this_type   = conv_1d_full_expr<A, B>;                  ///< The type of this expression
     using base_type   = base_temporary_expr_bin<this_type, A, B>; ///< The base type
     using left_traits = decay_traits<A>;                          ///< The traits of the left sub expression

     static constexpr auto storage_order = left_traits::storage_order; ///< The storage order, taken from the left sub expression

     /*!
      * \brief Indicates if the temporary expression can be directly evaluated
      * using only GPU.
      */
     static constexpr bool gpu_computable = false;

     /*!
      * \brief Construct a new expression
      * \param a The input (left) sub expression
      * \param b The kernel (right) sub expression
      */
     explicit conv_1d_full_expr(A a, B b) : base_type(a, b) {
         //Nothing else to init
     }

     // Assignment functions

     /*!
      * \brief Assert that the convolution is done on correct dimensions
      *
      * Two conditions are checked: the output must have
      * dim(input) + dim(kernel) - 1 elements and the input must be at least
      * as large as the kernel. When A, B and C are all fast, the checks are
      * static_assert; otherwise they are done with cpp_assert.
      *
      * \param input The input of the convolution
      * \param kernel The kernel of the convolution
      * \param conv The output of the convolution
      */
     template <etl_1d I, etl_1d K, etl_1d C>
     static void check([[maybe_unused]] const I& input, [[maybe_unused]] const K& kernel, [[maybe_unused]] const C& conv) {
         if constexpr (all_fast<A, B, C>) {
             static_assert(etl::dim<0, C>() == etl::dim<0, I>() + etl::dim<0, K>() - 1, "Invalid dimensions for conv1_full");
             static_assert(etl::dim<0, I>() >= etl::dim<0, K>(), "Invalid dimensions for conv1_full");
         } else {
             cpp_assert(etl::dim(conv, 0) == etl::dim(input, 0) + etl::dim(kernel, 0) - 1, "Invalid dimensions for conv1_full");
             cpp_assert(etl::dim(input, 0) >= etl::dim(kernel, 0), "Invalid dimensions for conv1_full");
         }
     }

     /*!
      * \brief Evaluate the convolution and store the result into conv
      *
      * The dimensions are checked first, then the implementation returned by
      * detail::select_conv1_impl_new is executed. For the VEC and STD
      * implementations, the work is dispatched through engine_dispatch_1d
      * when parallel support is enabled and detail::select_parallel asks
      * for it.
      *
      * \param conv The expression to which the result is assigned
      */
     template <etl_expr C>
     void assign_to(C&& conv) const {
         inc_counter("temp:assign");

         auto& input_raw  = this->a();
         auto& kernel_raw = this->b();

         check(input_raw, kernel_raw, conv);

         // Execute the correct implementation

         constexpr_select const auto impl = detail::select_conv1_impl_new<conv_type::FULL, A, B, C>();

         if constexpr_select (impl == etl::conv_impl::VEC) {
             inc_counter("inc:vec");

             if constexpr (parallel_support) {
                 bool parallel_dispatch = detail::select_parallel(input_raw, kernel_raw, conv);

                 if (parallel_dispatch) {
                     // Forward the operands once, outside of the functor,
                     // so that each dispatched range reuses them
                     decltype(auto) input  = smart_forward(input_raw);
                     decltype(auto) kernel = smart_forward(kernel_raw);

                     engine_dispatch_1d(
                             [&](size_t first, size_t last) { impl::vec::conv1_full(input, kernel, conv, first, last); }, 0, etl::size(conv), parallel_dispatch);
                 } else {
                     impl::vec::conv1_full(smart_forward(input_raw), smart_forward(kernel_raw), conv, 0, etl::size(conv));
                 }
             } else {
                 // The VEC implementation was selected (and counted above):
                 // it must also be the one executed without parallel support
                 impl::vec::conv1_full(smart_forward(input_raw), smart_forward(kernel_raw), conv, 0, etl::size(conv));
             }
         } else if constexpr_select (impl == etl::conv_impl::STD) {
             inc_counter("inc:std");

             if constexpr (parallel_support) {
                 bool parallel_dispatch = detail::select_parallel(input_raw, kernel_raw, conv);

                 if (parallel_dispatch) {
                     decltype(auto) input  = smart_forward(input_raw);
                     decltype(auto) kernel = smart_forward(kernel_raw);

                     engine_dispatch_1d([&](size_t first, size_t last) { impl::standard::conv1_full(input, kernel, conv, first, last); },
                                        0,
                                        etl::size(conv),
                                        parallel_dispatch);
                 } else {
                     impl::standard::conv1_full(smart_forward(input_raw), smart_forward(kernel_raw), conv, 0, etl::size(conv));
                 }
             } else {
                 impl::standard::conv1_full(smart_forward(input_raw), smart_forward(kernel_raw), conv, 0, etl::size(conv));
             }
         } else if constexpr_select (impl == etl::conv_impl::FFT_STD) {
             inc_counter("inc:fft_std");
             impl::standard::conv1_full_fft(smart_forward(input_raw), smart_forward(kernel_raw), conv);
         } else if constexpr_select (impl == etl::conv_impl::FFT_MKL) {
             inc_counter("inc:fft_mkl");
             impl::blas::conv1_full(smart_forward(input_raw), smart_forward(kernel_raw), conv);
         } else if constexpr_select (impl == etl::conv_impl::FFT_CUFFT) {
             inc_counter("inc:fft_cufft");
             impl::cufft::conv1_full(smart_forward_gpu(input_raw), smart_forward_gpu(kernel_raw), conv);
         } else if constexpr_select (impl == etl::conv_impl::EGBLAS) {
             if constexpr (all_homogeneous<A, B, C>) {
                 decltype(auto) input  = smart_forward_gpu(input_raw);
                 decltype(auto) kernel = smart_forward_gpu(kernel_raw);

                 // The operands must be available on GPU before the kernel is run
                 input.ensure_gpu_up_to_date();
                 kernel.ensure_gpu_up_to_date();

                 conv.ensure_gpu_allocated();

                 impl::egblas::conv1_full(
                         etl::size(input_raw), etl::size(kernel_raw), value_type(1), input.gpu_memory(), 1, kernel.gpu_memory(), 1, conv.gpu_memory(), 1);

                 // The result was written through conv.gpu_memory(): mark the
                 // GPU copy as valid and the CPU copy as invalid
                 conv.validate_gpu();
                 conv.invalidate_cpu();
             } else {
                 cpp_unreachable("Invalid conv implementation selection");
             }
         } else {
             cpp_unreachable("Invalid conv implementation selection");
         }
     }

     /*!
      * \brief Add to the given left-hand-side expression
      * \param lhs The expression to which the result is added
      */
     template <typename L>
     void assign_add_to(L&& lhs) const {
         std_add_evaluate(*this, lhs);
     }

     /*!
      * \brief Sub from the given left-hand-side expression
      * \param lhs The expression from which the result is subtracted
      */
     template <typename L>
     void assign_sub_to(L&& lhs) const {
         std_sub_evaluate(*this, lhs);
     }

     /*!
      * \brief Multiply the given left-hand-side expression
      * \param lhs The expression that is multiplied by the result
      */
     template <typename L>
     void assign_mul_to(L&& lhs) const {
         std_mul_evaluate(*this, lhs);
     }

     /*!
      * \brief Divide the given left-hand-side expression
      * \param lhs The expression that is divided by the result
      */
     template <typename L>
     void assign_div_to(L&& lhs) const {
         std_div_evaluate(*this, lhs);
     }

     /*!
      * \brief Modulo the given left-hand-side expression
      * \param lhs The expression on which the modulo is applied
      */
     template <typename L>
     void assign_mod_to(L&& lhs) const {
         std_mod_evaluate(*this, lhs);
     }

     /*!
      * \brief Print a representation of the expression on the given stream
      * \param os The output stream
      * \param expr The expression to print
      * \return the output stream
      */
     friend std::ostream& operator<<(std::ostream& os, const conv_1d_full_expr& expr) {
         return os << "conv1_full(" << expr._a << ", " << expr._b << ")";
     }
 };

 /*!
  * \brief Traits specialization for conv_1d_full_expr
  *
  * \tparam A The type of the left sub expression
  * \tparam B The type of the right sub expression
  */
 template <typename A, typename B>
 struct etl_traits<etl::conv_1d_full_expr<A, B>> {
     using expr_t       = etl::conv_1d_full_expr<A, B>; ///< The expression type
     using left_expr_t  = std::decay_t<A>;              ///< The left sub expression type
     using right_expr_t = std::decay_t<B>;              ///< The right sub expression type
     using left_traits  = etl_traits<left_expr_t>;      ///< The traits of the left sub expression
     using right_traits = etl_traits<right_expr_t>;     ///< The traits of the right sub expression
     using value_type   = value_t<A>;                   ///< The value type of the expression

     // Kind of expression
     static constexpr bool is_etl         = true;  ///< This is an ETL expression
     static constexpr bool is_transformer = false; ///< Not a transformer
     static constexpr bool is_view        = false; ///< Not a view
     static constexpr bool is_magic_view  = false; ///< Not a magic view
     static constexpr bool is_value       = false; ///< Not a value
     static constexpr bool is_generator   = false; ///< Not a generator
     static constexpr bool is_temporary   = true;  ///< This is a temporary expression

     // Evaluation properties
     static constexpr bool is_fast        = all_fast<A, B>; ///< Fast only when both sub expressions are fast
     static constexpr bool is_linear      = false;          ///< Not linear
     static constexpr bool is_thread_safe = true;           ///< Declared thread safe
     static constexpr bool is_direct      = true;           ///< Declared as direct
     static constexpr bool is_padded      = false;          ///< Declared as not padded
     static constexpr bool is_aligned     = true;           ///< Declared as aligned

     static constexpr bool gpu_computable = is_gpu_t<value_type> && cuda_enabled; ///< Needs a GPU value type and CUDA enabled
     static constexpr order storage_order = left_traits::storage_order;           ///< Same storage order as the left sub expression

     /*!
      * \brief Indicates if the expression is vectorizable using the
      * given vector mode
      * \tparam V The vector mode
      */
     template <vector_mode_t V>
     static constexpr bool vectorizable = true;

     /*!
      * \brief Returns the DDth dimension of the expression
      *
      * The template parameter is not used by the computation: the value is
      * always built from the first dimension of A and of B.
      *
      * \return dim<0>(A) + dim<0>(B) - 1
      */
     template <size_t DD>
     static constexpr size_t dim() {
         const size_t left_length  = etl::dim<0, A>();
         const size_t right_length = etl::dim<0, B>();

         return left_length + right_length - 1;
     }

     /*!
      * \brief Returns the dth dimension of the expression
      * \param e The sub expression
      * \param d The dimension to get (ignored by the computation)
      * \return dim(a, 0) + dim(b, 0) - 1
      */
     static size_t dim(const expr_t& e, [[maybe_unused]] size_t d) {
         const size_t left_length  = etl::dim(e._a, 0);
         const size_t right_length = etl::dim(e._b, 0);

         return left_length + right_length - 1;
     }

     /*!
      * \brief Returns the size of the expression
      * \param e The sub expression
      * \return the single dimension of the expression, since it is 1D
      */
     static size_t size(const expr_t& e) {
         return dim(e, 0);
     }

     /*!
      * \brief Returns the size of the expression, from the static dimensions
      * \return the single dimension of the expression, since it is 1D
      */
     static constexpr size_t size() {
         return dim<0>();
     }

     /*!
      * \brief Returns the number of dimensions of the expression
      * \return always 1
      */
     static constexpr size_t dimensions() {
         return 1;
     }

     /*!
      * \brief Estimate the complexity of computation
      * \return always -1
      */
     static constexpr int complexity() noexcept {
         return -1;
     }
 };

 /*!
  * \brief Creates an expression representing the full 1D convolution of a and b
  *
  * This function itself only constructs the expression object from its
  * two operands.
  *
  * \param a The input expression
  * \param b The kernel expression
  * \return an expression representing the full 1D convolution of a and b
  */
 template <etl_expr A, etl_expr B>
 conv_1d_full_expr<detail::build_type<A>, detail::build_type<B>> conv_1d_full(A&& a, B&& b) {
     using result_expr_t = conv_1d_full_expr<detail::build_type<A>, detail::build_type<B>>;

     return result_expr_t{a, b};
 }

 /*!
  * \brief Assigns the full 1D convolution of a and b to c
  *
  * The return type is deduced with plain auto from `return c;`, so it is
  * never a reference: the caller receives a new object initialized from c,
  * not a reference to c itself.
  *
  * \param a The input expression
  * \param b The kernel expression
  * \param c The expression receiving the result
  * \return an object initialized from c after the assignment
  */
 template <etl_expr A, etl_expr B, etl_expr C>
 auto conv_1d_full(A&& a, B&& b, C&& c) {
     // Build the two-operand expression and assign it to c
     c = conv_1d_full(a, b);
     return c;
 }

 } //end of namespace etl
etl::conv_1d_full_expr
A 1D full convolution expression.
Definition: conv_1d_full_expr.hpp:23

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::size
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: conv_1d_full_expr.hpp:265

etl::conv_impl::FFT_MKL
FFT reduction (with MKL impl)

etl::conv_1d_full_expr::assign_sub_to
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:162

etl::conv_1d_full_expr::assign_mod_to
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:189

etl::engine_dispatch_1d
void engine_dispatch_1d(Functor &&functor, size_t first, size_t last, [[maybe_unused]] size_t threshold, [[maybe_unused]] size_t n_threads=etl::threads)
Dispatch the elements of a range to a functor in a parallel manner, using the global thread engine...
Definition: parallel_support.hpp:708

etl::conv_1d_full_expr::value_type
value_t< A > value_type
The type of value of the expression.
Definition: conv_1d_full_expr.hpp:24

etl::base_temporary_expr_bin::_b
B _b
The sub expression reference.
Definition: base_temporary_expr.hpp:534

etl::conv_1d_full_expr::assign_mul_to
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:171

etl::batch_softmax_impl::STD
Standard implementation.

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::dim
static constexpr size_t dim()
Returns the DDth dimension of the expression.
Definition: conv_1d_full_expr.hpp:246

etl::is_magic_view
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311

etl::base_temporary_expr_bin::_a
A _a
The sub expression reference.
Definition: base_temporary_expr.hpp:533

etl::conv_1d_full_expr::gpu_computable
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: conv_1d_full_expr.hpp:35

etl::conv_1d_full_expr::conv_1d_full_expr
conv_1d_full_expr(A a, B b)
Construct a new expression.
Definition: conv_1d_full_expr.hpp:41

etl::conv_1d_full_expr::assign_div_to
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:180

etl::order
order
Storage order of a matrix.
Definition: order.hpp:15

etl::cuda_enabled
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::right_expr_t
std::decay_t< B > right_expr_t
The right sub expression type.
Definition: conv_1d_full_expr.hpp:212

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::complexity
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: conv_1d_full_expr.hpp:289

etl::base_temporary_expr_bin
Abstract base class for temporary binary expression.
Definition: base_temporary_expr.hpp:529

etl::bias_add_impl::VEC
VEC implementation.

etl::conv_1d_full_expr::check
static void check([[maybe_unused]] const I &input, [[maybe_unused]] const K &kernel, [[maybe_unused]] const C &conv)
Assert that the convolution is done on correct dimensions.
Definition: conv_1d_full_expr.hpp:51

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::dim
static size_t dim(const expr_t &e, [[maybe_unused]] size_t d)
Returns the dth dimension of the expression.
Definition: conv_1d_full_expr.hpp:256

etl::base_temporary_expr_bin< conv_1d_full_expr< A, B >, A, B >::b
std::add_lvalue_reference_t< B > b()
Returns the sub expression.
Definition: base_temporary_expr.hpp:593

etl::is_fast
constexpr bool is_fast
Traits to test if the given ETL expression type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588

etl::conv_1d_full_expr::operator<<
friend std::ostream & operator<<(std::ostream &os, const conv_1d_full_expr &expr)
Print a representation of the expression on the given stream.
Definition: conv_1d_full_expr.hpp:199

etl::etl_traits
Traits to get information about ETL types.
Definition: tmp.hpp:68

etl
Root namespace for the ETL library.
Definition: adapter.hpp:15

etl::conv_impl::FFT_STD
FFT reduction (with STD impl)

etl::bce_impl::EGBLAS
GPU implementation.

etl::dim
auto dim(E &&value, size_t i) -> detail::identity_helper< E, dim_view< detail::build_identity_type< E >, D >>
Return a view representing the ith Dth dimension.
Definition: view_expression_builder.hpp:25

etl::detail::build_type
std::conditional_t< is_etl_value< T >, const std::decay_t< T > &, std::decay_t< T > > build_type
Helper to build the type for a sub expression.
Definition: expression_helpers.hpp:24

etl::std_mod_evaluate
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::value_type
value_t< A > value_type
The value type of the expression.
Definition: conv_1d_full_expr.hpp:215

etl::std_mul_evaluate
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233

etl::is_transformer
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::size
static constexpr size_t size()
Returns the size of the expression.
Definition: conv_1d_full_expr.hpp:273

conv.hpp
Selector for the convolution implementations.

etl::smart_forward_gpu
decltype(auto) smart_forward_gpu(E &expr)
Smart forwarding for a temporary expression that will be computed in GPU.
Definition: helpers.hpp:343

etl::size
constexpr size_t size(const E &expr) noexcept
Returns the size of the given ETL expression.
Definition: helpers.hpp:108

etl::is_view
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304

etl::std_sub_evaluate
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214

etl::smart_forward
decltype(auto) smart_forward(E &expr)
Smart forwarding for a temporary expression.
Definition: helpers.hpp:323

etl::conv_1d_full_expr::assign_to
void assign_to(C &&conv) const
Assign to a matrix of the same storage order.
Definition: conv_1d_full_expr.hpp:66

etl::parallel_support
constexpr bool parallel_support
Indicates if support for parallelization is integrated into the framework.
Definition: config.hpp:51

etl::is_thread_safe
constexpr bool is_thread_safe
Traits to test if the given ETL expression type is thread safe.
Definition: traits.hpp:687

etl::conv_1d_full
conv_1d_full_expr< detail::build_type< A >, detail::build_type< B > > conv_1d_full(A &&a, B &&b)
Creates an expression representing the full 1D convolution of a and b.
Definition: conv_1d_full_expr.hpp:301

etl::conv_1d_full_expr::storage_order
static constexpr auto storage_order
The sub storage order.
Definition: conv_1d_full_expr.hpp:29

conv_select.hpp
Contains selectors for convolution implementations.

etl::value_t
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81

etl::std_div_evaluate
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252

etl::inc_counter
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25

etl::conv_1d_full_expr::assign_add_to
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: conv_1d_full_expr.hpp:153

etl::base_temporary_expr_bin< conv_1d_full_expr< A, B >, A, B >::a
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:577

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::left_expr_t
std::decay_t< A > left_expr_t
The left sub expression type.
Definition: conv_1d_full_expr.hpp:211

etl::std_add_evaluate
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195

etl::etl_traits< etl::conv_1d_full_expr< A, B > >::dimensions
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: conv_1d_full_expr.hpp:281

etl::conv_impl::FFT_CUFFT
FFT reduction (with CUFFT impl)