Expression Templates Library (ETL)
transpose_expr.hpp
1 //=======================================================================
2 // Copyright (c) 2014-2023 Baptiste Wicht
3 // Distributed under the terms of the MIT License.
4 // (See accompanying file LICENSE or copy at
5 // http://opensource.org/licenses/MIT)
6 //=======================================================================
7 
8 #pragma once
9 
10 #include "etl/expr/base_temporary_expr.hpp"
11 
12 //Get the implementations
13 #include "etl/impl/transpose.hpp"
14 
15 namespace etl {
16 
21 template <typename A>
22 struct transpose_expr : base_temporary_expr_un<transpose_expr<A>, A> {
27 
// The sub storage order: this expression reports the storage order of its sub expression's traits.
28  static constexpr auto storage_order = sub_traits::storage_order;
29 
// Indicates if the temporary expression can be directly evaluated using only GPU.
// True only when cublas_enabled is set and all_floating<A> holds
// (presumably: A has a floating-point value type - TODO confirm against all_floating).
34  static constexpr bool gpu_computable = cublas_enabled && all_floating<A>;
35 
// Construct a new expression.
// a: the sub expression to transpose; it is handed unchanged to the base_type constructor.
// The constructor is explicit, so an A is never implicitly converted into a transpose_expr.
40  explicit transpose_expr(A a) : base_type(a) {
41  //Nothing else to init
42  }
43 
// Validate the transposition dimensions.
//
// a: the sub expression being transposed (right-hand side, dimensions R1 x R2).
// c: the destination of the transposition (left-hand side, dimensions L1 x L2).
//
// The four xx_to_yy flags are named <order of c>_to_<order of a>:
//  - same storage order on both sides (rm_to_rm, cm_to_cm): c must have the
//    swapped dimensions of a (L1 == R2 and L2 == R1);
//  - different storage orders (rm_to_cm, cm_to_rm): either the swapped
//    dimensions or the identical dimensions (L1 == R1 and L2 == R2) are accepted.
//
// When all_fast<A, C> holds, the dimensions are read from decay_traits at compile
// time and violations are reported through static_assert; otherwise the dimensions
// are read with etl::dim<>() at run time and checked through cpp_assert.
49  template <typename C>
50  static void check([[maybe_unused]] const A& a, [[maybe_unused]] const C& c) {
51  static constexpr etl::order order_lhs = decay_traits<C>::storage_order;
52  static constexpr etl::order order_rhs = decay_traits<A>::storage_order;
53 
54  [[maybe_unused]] static constexpr bool rm_to_rm = order_lhs == etl::order::RowMajor && order_rhs == etl::order::RowMajor;
55  [[maybe_unused]] static constexpr bool cm_to_cm = order_lhs == etl::order::ColumnMajor && order_rhs == etl::order::ColumnMajor;
56  [[maybe_unused]] static constexpr bool rm_to_cm = order_lhs == etl::order::RowMajor && order_rhs == etl::order::ColumnMajor;
57  [[maybe_unused]] static constexpr bool cm_to_rm = order_lhs == etl::order::ColumnMajor && order_rhs == etl::order::RowMajor;
58 
59  if constexpr (all_fast<A, C>) {
60  static constexpr size_t L1 = decay_traits<C>::template dim<0>();
61  static constexpr size_t L2 = decay_traits<C>::template dim<1>();
62  static constexpr size_t R1 = decay_traits<A>::template dim<0>();
63  static constexpr size_t R2 = decay_traits<A>::template dim<1>();
64 
65  // Case 1: RM -> RM
66  static_assert(!rm_to_rm || (L1 == R2 && L2 == R1), "Invalid dimensions for transposition");
67 
68  // Case 2: CM -> CM
69  static_assert(!cm_to_cm || (L1 == R2 && L2 == R1), "Invalid dimensions for transposition");
70 
71  // Case 3: RM -> CM (two possible cases)
72  static_assert(!rm_to_cm || ((L1 == R2 && L2 == R1) || (L1 == R1 && L2 == R2)), "Invalid dimensions for transposition");
73 
74  // Case 4: CM -> RM (two possible cases)
75  static_assert(!cm_to_rm || ((L1 == R2 && L2 == R1) || (L1 == R1 && L2 == R2)), "Invalid dimensions for transposition");
76  } else {
77  [[maybe_unused]] const size_t L1 = etl::dim<0>(c);
78  [[maybe_unused]] const size_t L2 = etl::dim<1>(c);
79  [[maybe_unused]] const size_t R1 = etl::dim<0>(a);
80  [[maybe_unused]] const size_t R2 = etl::dim<1>(a);
81 
82  // Case 1: RM -> RM
83  cpp_assert(!rm_to_rm || (L1 == R2 && L2 == R1), "Invalid dimensions for transposition");
84 
85  // Case 2: CM -> CM
86  cpp_assert(!cm_to_cm || (L1 == R2 && L2 == R1), "Invalid dimensions for transposition");
87 
88  // Case 3: RM -> CM (two possible cases)
89  cpp_assert(!rm_to_cm || ((L1 == R2 && L2 == R1) || (L1 == R1 && L2 == R2)), "Invalid dimensions for transposition");
90 
91  // Case 4: CM -> RM (two possible cases)
92  cpp_assert(!cm_to_rm || ((L1 == R2 && L2 == R1) || (L1 == R1 && L2 == R2)), "Invalid dimensions for transposition");
93  }
94  }
95 
96  // Assignment functions
97 
// Assign to a matrix of the same storage order.
//
// c: the destination expression (constrained by the etl_expr concept).
//
// If c has the same storage order as this expression, the "temp:assign" counter is
// incremented, the sub expression is fetched and the dimensions are validated with
// check(). Otherwise the whole assignment is delegated to std_assign_evaluate(*this, c).
102  template <etl_expr C>
103  void assign_to(C&& c) const {
104  if constexpr (decay_traits<C>::storage_order == storage_order) {
105  inc_counter("temp:assign");
106 
107  auto& a = this->a();
108 
109  check(a, c);
110 
// NOTE(review): listing line 111 is absent from this view (the numbering jumps from
// 110 to 112). As shown, this branch only validates the dimensions and never writes
// to c - presumably the dropped line performs the actual transposition; confirm
// against the original file.
112  } else {
113  std_assign_evaluate(*this, c);
114  }
115  }
116 
// Add to the given left-hand-side expression.
// lhs: the expression to add to; it is perfectly forwarded to std_add_evaluate,
// which performs the compound add evaluation of *this into it.
121  template <typename L>
122  void assign_add_to(L&& lhs) const {
123  std_add_evaluate(*this, std::forward<L>(lhs));
124  }
125 
// Sub from the given left-hand-side expression.
// lhs: the expression to subtract from; it is perfectly forwarded to std_sub_evaluate,
// which performs the compound subtract evaluation of *this into it.
130  template <typename L>
131  void assign_sub_to(L&& lhs) const {
132  std_sub_evaluate(*this, std::forward<L>(lhs));
133  }
134 
// Multiply the given left-hand-side expression.
// lhs: the expression to multiply; it is perfectly forwarded to std_mul_evaluate,
// which performs the compound multiply evaluation of *this into it.
139  template <typename L>
140  void assign_mul_to(L&& lhs) const {
141  std_mul_evaluate(*this, std::forward<L>(lhs));
142  }
143 
// Divide the given left-hand-side expression.
// lhs: the expression to divide; it is perfectly forwarded to std_div_evaluate,
// which performs the compound divide evaluation of *this into it.
148  template <typename L>
149  void assign_div_to(L&& lhs) const {
150  std_div_evaluate(*this, std::forward<L>(lhs));
151  }
152 
// Modulo the given left-hand-side expression.
// lhs: the expression to apply the modulo to; it is perfectly forwarded to
// std_mod_evaluate, which performs the compound modulo evaluation of *this into it.
157  template <typename L>
158  void assign_mod_to(L&& lhs) const {
159  std_mod_evaluate(*this, std::forward<L>(lhs));
160  }
161 
// Print a representation of the expression on the given stream.
// os: the output stream; expr: the expression to print.
// Writes "trans(", then the sub expression expr._a, then ")" and returns os so
// that insertions can be chained.
168  friend std::ostream& operator<<(std::ostream& os, const transpose_expr& expr) {
169  return os << "trans(" << expr._a << ")";
170  }
171 };
172 
177 template <typename A>
// The sub expression type: A with references and cv-qualifiers removed by std::decay_t.
// NOTE(review): the enclosing struct header (listing lines 178-179) is not visible in
// this view - presumably the traits specialization for transpose_expr<A>; confirm.
180  using sub_expr_t = std::decay_t<A>;
183 
// Compile-time trait flags of the expression.
// Most flags are fixed constants; is_fast and storage_order are taken from the
// sub expression's traits (sub_traits), and gpu_computable depends on the value
// type and on whether CUDA is available.
// NOTE(review): gpu_computable here is gated on cuda_enabled and is_gpu_t<value_type>,
// whereas transpose_expr::gpu_computable is gated on cublas_enabled and
// all_floating<A> - confirm the difference is intentional.
184  static constexpr bool is_etl = true;
185  static constexpr bool is_transformer = false;
186  static constexpr bool is_view = false;
187  static constexpr bool is_magic_view = false;
188  static constexpr bool is_fast = sub_traits::is_fast;
189  static constexpr bool is_linear = true;
190  static constexpr bool is_thread_safe = true;
191  static constexpr bool is_value = false;
192  static constexpr bool is_direct = true;
193  static constexpr bool is_generator = false;
194  static constexpr bool is_padded = false;
195  static constexpr bool is_aligned = true;
196  static constexpr bool is_temporary = true;
197  static constexpr bool gpu_computable = is_gpu_t<value_type> && cuda_enabled;
198  static constexpr order storage_order = sub_traits::storage_order;
199 
// Vectorization flag, parameterized by the vector mode V.
// It is unconditionally true: the value does not depend on V.
205  template <vector_mode_t V>
206  static constexpr bool vectorizable = true;
207 
// Returns the DDth dimension of the expression, known at compile time.
// The dimensions of A are swapped: DD == 0 yields A's dimension 1, and any other
// DD yields A's dimension 0.
212  template <size_t DD>
213  static constexpr size_t dim() {
214  return DD == 0 ? decay_traits<A>::template dim<1>() : decay_traits<A>::template dim<0>();
215  }
216 
// Returns the dth dimension of the expression.
// e: the expression to query; d: the index of the dimension.
// The dimensions of the sub expression e._a are swapped: d == 0 yields its
// dimension 1, and any other d yields its dimension 0.
223  static size_t dim(const expr_t& e, size_t d) {
224  return d == 0 ? etl::dim<1>(e._a) : etl::dim<0>(e._a);
225  }
226 
// Returns the size of the expression.
// e: the expression to query. The result is the size of its sub expression e._a.
232  static size_t size(const expr_t& e) {
233  return etl::size(e._a);
234  }
235 
// Returns the size of the expression, known at compile time.
// The result is the compile-time size reported by the traits of A.
240  static constexpr size_t size() {
241  return decay_traits<A>::size();
242  }
243 
// Returns the number of dimensions of the expression, which is always 2.
248  static constexpr size_t dimensions() {
249  return 2;
250  }
251 
// Estimate the complexity of computation.
// Always returns -1 (presumably a sentinel meaning "no estimate" - TODO confirm
// how callers interpret a negative complexity).
256  static constexpr int complexity() noexcept {
257  return -1;
258  }
259 };
260 
261 } //end of namespace etl
std::decay_t< A > sub_expr_t
The sub expression type.
Definition: transpose_expr.hpp:180
static void apply(A &&a, C &&c)
Transpose a and store the results in c.
Definition: transpose.hpp:336
std::add_lvalue_reference_t< A > a()
Returns the sub expression.
Definition: base_temporary_expr.hpp:489
void std_assign_evaluate(Expr &&expr, Result &&result)
Evaluation of the expr into result.
Definition: evaluator.hpp:1176
transpose_expr(A a)
Construct a new expression.
Definition: transpose_expr.hpp:40
constexpr bool is_magic_view
Traits indicating if the given ETL type is a magic view expression.
Definition: traits.hpp:311
static size_t size(const expr_t &e)
Returns the size of the expression.
Definition: transpose_expr.hpp:232
void assign_to(C &&c) const
Assign to a matrix of the same storage order.
Definition: transpose_expr.hpp:103
value_t< A > value_type
The type of value of the expression.
Definition: transpose_expr.hpp:23
static constexpr size_t dimensions()
Returns the number of dimensions of the expression.
Definition: transpose_expr.hpp:248
order
Storage order of a matrix.
Definition: order.hpp:15
constexpr bool cuda_enabled
Indicates if CUDA is available.
Definition: config.hpp:94
static constexpr bool gpu_computable
Indicates if the temporary expression can be directly evaluated using only GPU.
Definition: transpose_expr.hpp:34
A _a
The sub expression reference.
Definition: base_temporary_expr.hpp:447
Implementations of inplace matrix transposition.
constexpr bool is_fast
Traits to test if the given ETL expression type is fast (sizes known at compile-time) ...
Definition: traits.hpp:588
static constexpr size_t size()
Returns the size of the expression.
Definition: transpose_expr.hpp:240
Traits to get information about ETL types.
Definition: tmp.hpp:68
Root namespace for the ETL library.
Definition: adapter.hpp:15
value_t< A > value_type
The value type of the expression.
Definition: transpose_expr.hpp:182
void assign_sub_to(L &&lhs) const
Sub from the given left-hand-side expression.
Definition: transpose_expr.hpp:131
constexpr bool cublas_enabled
Indicates if the NVIDIA CUBLAS library is available for ETL.
Definition: config.hpp:99
void assign_mul_to(L &&lhs) const
Multiply the given left-hand-side expression.
Definition: transpose_expr.hpp:140
void std_mod_evaluate(Expr &&expr, Result &&result)
Compound modulo evaluation of the expr into result.
Definition: evaluator.hpp:1271
void assign_div_to(L &&lhs) const
Divide the given left-hand-side expression.
Definition: transpose_expr.hpp:149
static constexpr int complexity() noexcept
Estimate the complexity of computation.
Definition: transpose_expr.hpp:256
void std_mul_evaluate(Expr &&expr, Result &&result)
Compound multiply evaluation of the expr into result.
Definition: evaluator.hpp:1233
constexpr bool is_transformer
Traits indicating if the given ETL type is a transformer expression.
Definition: traits.hpp:297
static constexpr auto storage_order
The sub storage order.
Definition: transpose_expr.hpp:28
static void check([[maybe_unused]] const A &a, [[maybe_unused]] const C &c)
Validate the transposition dimensions.
Definition: transpose_expr.hpp:50
Column-Major storage.
constexpr size_t size(const E &expr) noexcept
Returns the size of the given ETL expression.
Definition: helpers.hpp:108
constexpr bool is_view
Traits indicating if the given ETL type is a view expression.
Definition: traits.hpp:304
A transposition expression.
Definition: transpose_expr.hpp:22
friend std::ostream & operator<<(std::ostream &os, const transpose_expr &expr)
Print a representation of the expression on the given stream.
Definition: transpose_expr.hpp:168
static constexpr bool is_fast
Indicates if T is a fast structure.
Definition: traits_base.hpp:25
void std_sub_evaluate(Expr &&expr, Result &&result)
Compound subtract evaluation of the expr into result.
Definition: evaluator.hpp:1214
Abstract base class for temporary unary expression.
Definition: base_temporary_expr.hpp:443
constexpr bool is_thread_safe
Traits to test if the given ETL expression type is thread safe.
Definition: traits.hpp:687
void assign_mod_to(L &&lhs) const
Modulo the given left-hand-side expression.
Definition: transpose_expr.hpp:158
static size_t dim(const expr_t &e, size_t d)
Returns the dth dimension of the expression.
Definition: transpose_expr.hpp:223
void assign_add_to(L &&lhs) const
Add to the given left-hand-side expression.
Definition: transpose_expr.hpp:122
typename decay_traits< E >::value_type value_t
Traits to extract the value type out of an ETL type.
Definition: tmp.hpp:81
void std_div_evaluate(Expr &&expr, Result &&result)
Compound divide evaluation of the expr into result.
Definition: evaluator.hpp:1252
Row-Major storage.
void inc_counter([[maybe_unused]] const char *name)
Increase the given counter.
Definition: counters.hpp:25
static constexpr size_t dim()
Returns the DDth dimension of the expression.
Definition: transpose_expr.hpp:213
void std_add_evaluate(Expr &&expr, Result &&result)
Compound add evaluation of the expr into result.
Definition: evaluator.hpp:1195