wichtounet/etl/op_2unary_2log2_8hpp_source.html

 //=======================================================================
 // Copyright (c) 2014-2023 Baptiste Wicht
 // Distributed under the terms of the MIT License.
 // (See accompanying file LICENSE or copy at
 //  http://opensource.org/licenses/MIT)
 //=======================================================================

 #pragma once

 #include "etl/impl/egblas/log2.hpp"

 namespace etl {

 template <typename T>
 struct log2_unary_op {
     static constexpr bool linear      = true;
     static constexpr bool thread_safe = true;

     template <vector_mode_t V>
     static constexpr bool vectorizable =
         (V == vector_mode_t::SSE3 && is_single_precision_t<T>) || (V == vector_mode_t::AVX && is_single_precision_t<T>) || (intel_compiler && !is_complex_t<T>);

     template <typename E>
     static constexpr bool gpu_computable = (is_single_precision_t<T> && impl::egblas::has_slog2) || (is_double_precision_t<T> && impl::egblas::has_dlog2)
                                            || (is_complex_single_t<T> && impl::egblas::has_clog2) || (is_complex_double_t<T> && impl::egblas::has_zlog2);

     static constexpr int complexity() {
         return 12;
     }

     template <typename V = default_vec>
     using vec_type = typename V::template vec_type<T>;

     static constexpr T apply(const T& x) {
         return std::log2(x);
     }

     template <typename V = default_vec>
     static vec_type<V> load(const vec_type<V>& x) noexcept {
         return V::div(V::log(x), V::log(V::set(T(2))));
     }

     template <typename X, typename Y>
     static auto gpu_compute_hint(const X& x, Y& y) noexcept {
         decltype(auto) t1 = smart_gpu_compute_hint(x, y);

         auto t2 = force_temporary_gpu_dim_only(t1);

         T alpha(1.0);
         impl::egblas::log2(etl::size(y), alpha, t1.gpu_memory(), 1, t2.gpu_memory(), 1);

         return t2;
     }

     template <typename X, typename Y>
     static Y& gpu_compute(const X& x, Y& y) noexcept {
         decltype(auto) t1 = select_smart_gpu_compute(x, y);

         T alpha(1.0);
         impl::egblas::log2(etl::size(y), alpha, t1.gpu_memory(), 1, y.gpu_memory(), 1);

         y.validate_gpu();
         y.invalidate_cpu();

         return y;
     }

     static std::string desc() noexcept {
         return "log2";
     }
 };

 /*!
  * \brief Specialization of the base-2 logarithm unary operation for
  * std::complex values
  * \tparam TT The inner type of the complex number
  */
 template <typename TT>
 struct log2_unary_op<std::complex<TT>> {
     using T = std::complex<TT>; ///< The complex value type handled by this specialization

     static constexpr bool linear      = true; ///< Indicates if the operator is linear
     static constexpr bool thread_safe = true; ///< Indicates if the operator is thread safe

     /*!
      * \brief Indicates if the expression is vectorizable using the
      * given vector mode (never the case for this specialization)
      * \tparam V The vector mode
      */
     template <vector_mode_t V>
     static constexpr bool vectorizable = false;

     /*!
      * \brief Indicates if the operator can be computed on GPU
      *
      * True when the impl::egblas::has_*log2 flag matching the
      * precision of T is set.
      *
      * \tparam E The sub-expression type (not used by the condition)
      */
     template <typename E>
     static constexpr bool gpu_computable =
            (is_single_precision_t<T> && impl::egblas::has_slog2)
         || (is_double_precision_t<T> && impl::egblas::has_dlog2)
         || (is_complex_single_t<T> && impl::egblas::has_clog2)
         || (is_complex_double_t<T> && impl::egblas::has_zlog2);

     /*!
      * \brief Estimate the complexity of the operator
      * \return The estimated complexity of the operator
      */
     static constexpr int complexity() {
         return 12;
     }

     /*!
      * \brief Apply the unary operator on x
      * \param x The value on which to apply the operator
      * \return The base-2 logarithm of x
      */
     static constexpr T apply(const T& x) {
         // Change of base: log2(x) = log(x) / log(2), with 2 taken as a complex value
         const T two{TT(2)};

         return std::log(x) / std::log(two);
     }

     /*!
      * \brief Compute the result of the operation using the GPU
      *
      * The result is written into a new temporary created from the
      * GPU representation of x; y is only used for the hint and for
      * the number of elements.
      *
      * \param x The expression of the unary operation
      * \param y The expression used as hint and for the size
      *
      * \return The temporary holding the result on the GPU
      */
     template <typename X, typename Y>
     static auto gpu_compute_hint(const X& x, Y& y) noexcept {
         decltype(auto) gpu_input = smart_gpu_compute_hint(x, y);

         // Temporary created from the input, without copying its content
         auto gpu_output = force_temporary_gpu_dim_only(gpu_input);

         T scale(1.0);
         impl::egblas::log2(etl::size(y), scale, gpu_input.gpu_memory(), 1, gpu_output.gpu_memory(), 1);

         return gpu_output;
     }

     /*!
      * \brief Compute the result of the operation using the GPU
      *
      * The result is written into the GPU memory of y, which is then
      * flagged as valid on the GPU and invalid on the CPU.
      *
      * \param x The expression of the unary operation
      * \param y The expression into which to store the result
      *
      * \return A reference to y
      */
     template <typename X, typename Y>
     static Y& gpu_compute(const X& x, Y& y) noexcept {
         decltype(auto) gpu_input = select_smart_gpu_compute(x, y);

         T scale(1.0);
         impl::egblas::log2(etl::size(y), scale, gpu_input.gpu_memory(), 1, y.gpu_memory(), 1);

         // The GPU copy of y is now the reference version
         y.validate_gpu();
         y.invalidate_cpu();

         return y;
     }

     /*!
      * \brief Returns a textual representation of the operator
      * \return a string representing the operator
      */
     static std::string desc() noexcept {
         return "log2";
     }
 };

 template <typename TT>
 struct log2_unary_op<etl::complex<TT>> {
     using T = etl::complex<TT>;

     static constexpr bool linear      = true;
     static constexpr bool thread_safe = true;

     template <vector_mode_t V>
     static constexpr bool vectorizable = false;

     template <typename E>
     static constexpr bool gpu_computable = (is_single_precision_t<T> && impl::egblas::has_slog2) || (is_double_precision_t<T> && impl::egblas::has_dlog2)
                                            || (is_complex_single_t<T> && impl::egblas::has_clog2) || (is_complex_double_t<T> && impl::egblas::has_zlog2);

     static constexpr int complexity() {
         return 12;
     }

     static constexpr T apply(const T& x) {
         return etl::log2(x);
     }

     template <typename X, typename Y>
     static auto gpu_compute_hint(const X& x, Y& y) noexcept {
         decltype(auto) t1 = smart_gpu_compute_hint(x, y);

         auto t2 = force_temporary_gpu_dim_only(t1);

         T alpha(1.0);
         impl::egblas::log2(etl::size(y), alpha, t1.gpu_memory(), 1, t2.gpu_memory(), 1);

         return t2;
     }

     template <typename X, typename Y>
     static Y& gpu_compute(const X& x, Y& y) noexcept {
         decltype(auto) t1 = select_smart_gpu_compute(x, y);

         T alpha(1.0);
         impl::egblas::log2(etl::size(y), alpha, t1.gpu_memory(), 1, y.gpu_memory(), 1);

         y.validate_gpu();
         y.invalidate_cpu();

         return y;
     }

     static std::string desc() noexcept {
         return "log2";
     }
 };

 } //end of namespace etl
etl::log2_unary_op< std::complex< TT > >::apply
static constexpr T apply(const T &x)
Apply the unary operator on x.
Definition: log2.hpp:158

etl::log2_unary_op::load
static vec_type< V > load(const vec_type< V > &x) noexcept
Compute several applications of the operator at a time.
Definition: log2.hpp:69

etl::complex
Complex number implementation.
Definition: complex.hpp:31

etl::log2
auto log2(E &&value) -> detail::unary_helper< E, log2_unary_op >
Apply logarithm (base 2) on each value of the given expression.
Definition: function_expression_builder.hpp:74

etl::log2_unary_op< std::complex< TT > >::gpu_compute_hint
static auto gpu_compute_hint(const X &x, Y &y) noexcept
Compute the result of the operation using the GPU.
Definition: log2.hpp:170

etl::log2_unary_op< etl::complex< TT > >::gpu_compute
static Y & gpu_compute(const X &x, Y &y) noexcept
Compute the result of the operation using the GPU.
Definition: log2.hpp:277

etl::log2_unary_op< etl::complex< TT > >::apply
static constexpr T apply(const T &x)
Apply the unary operator on x.
Definition: log2.hpp:247

etl::select_smart_gpu_compute
decltype(auto) select_smart_gpu_compute(X &x, Y &y)
Compute the expression into a representation that is GPU up to date and possibly store this represent...
Definition: helpers.hpp:434

etl::log2_unary_op::vectorizable
static constexpr bool vectorizable
Indicates if the expression is vectorizable using the given vector mode.
Definition: log2.hpp:29

etl::vector_mode_t::SSE3
SSE3 is the max vectorization available.

etl::intel_compiler
constexpr bool intel_compiler
Indicates if the project is compiled with the Intel compiler.
Definition: config.hpp:225

etl::log2_unary_op< etl::complex< TT > >::complexity
static constexpr int complexity()
Estimate the complexity of operator.
Definition: log2.hpp:238

etl
Root namespace for the ETL library.
Definition: adapter.hpp:15

etl::log2_unary_op::desc
static std::string desc() noexcept
Returns a textual representation of the operator.
Definition: log2.hpp:115

etl::log2_unary_op
Unary operation taking the logarithmic value (base 2)
Definition: log2.hpp:19

etl::log2_unary_op< etl::complex< TT > >::gpu_compute_hint
static auto gpu_compute_hint(const X &x, Y &y) noexcept
Compute the result of the operation using the GPU.
Definition: log2.hpp:259

etl::log2_unary_op::complexity
static constexpr int complexity()
Estimate the complexity of operator.
Definition: log2.hpp:43

log2.hpp
EGBLAS wrappers for the log2 operation.

etl::log2_unary_op< etl::complex< TT > >::desc
static std::string desc() noexcept
Returns a textual representation of the operator.
Definition: log2.hpp:293

etl::force_temporary_gpu_dim_only
decltype(auto) force_temporary_gpu_dim_only(E &&expr)
Force a temporary out of the expression, without copying its content.
Definition: temporary.hpp:223

etl::size
constexpr size_t size(const E &expr) noexcept
Returns the size of the given ETL expression.
Definition: helpers.hpp:108

etl::log2_unary_op::thread_safe
static constexpr bool thread_safe
Indicates if the operator is thread safe or not.
Definition: log2.hpp:21

etl::log2_unary_op::apply
static constexpr T apply(const T &x)
Apply the unary operator on x.
Definition: log2.hpp:58

etl::log2_unary_op::gpu_computable
static constexpr bool gpu_computable
Indicates if the operator can be computed on GPU.
Definition: log2.hpp:36

etl::vector_mode_t::AVX
AVX is the max vectorization available.

etl::log2_unary_op::gpu_compute_hint
static auto gpu_compute_hint(const X &x, Y &y) noexcept
Compute the result of the operation using the GPU.
Definition: log2.hpp:81

etl::log2_unary_op::gpu_compute
static Y & gpu_compute(const X &x, Y &y) noexcept
Compute the result of the operation using the GPU.
Definition: log2.hpp:99

etl::smart_gpu_compute_hint
decltype(auto) smart_gpu_compute_hint(E &expr, Y &y)
Compute the expression into a representation that is GPU up to date.
Definition: helpers.hpp:368

etl::log2_unary_op::vec_type
typename V::template vec_type< T > vec_type
Definition: log2.hpp:51

etl::log
auto log(E &&value) -> detail::unary_helper< E, log_unary_op >
Apply logarithm (base e) on each value of the given expression.
Definition: function_expression_builder.hpp:64

etl::log2_unary_op< std::complex< TT > >::T
std::complex< TT > T
The actual value type of the operator (the complex type std::complex< TT >).
Definition: log2.hpp:125

etl::log2_unary_op::linear
static constexpr bool linear
Indicates if the operator is linear.
Definition: log2.hpp:20

etl::log2_unary_op< std::complex< TT > >::desc
static std::string desc() noexcept
Returns a textual representation of the operator.
Definition: log2.hpp:204

etl::log2_unary_op< std::complex< TT > >::gpu_compute
static Y & gpu_compute(const X &x, Y &y) noexcept
Compute the result of the operation using the GPU.
Definition: log2.hpp:188

etl::log2_unary_op< std::complex< TT > >::complexity
static constexpr int complexity()
Estimate the complexity of operator.
Definition: log2.hpp:149