#include <kernel_ops.h>
|
| template<typename Expr > |
| static FORCE_INLINE void | eval (T *output, const Expr &expr) noexcept |
| | Evaluation dispatch: pick contiguous or permuted eval based on expression layout.
|
| |
| template<typename Expr > |
| static FORCE_INLINE T | reduce_min (const Expr &expr) noexcept |
| |
| template<typename Expr > |
| static FORCE_INLINE T | reduce_max (const Expr &expr) noexcept |
| |
| template<typename Expr > |
| static FORCE_INLINE T | reduce_sum (const Expr &expr) noexcept |
| |
| template<typename Expr1 , typename Expr2 > |
| static FORCE_INLINE bool | reduce_all_approx_equal (const Expr1 &lhs, const Expr2 &rhs, T tolerance) noexcept |
| | Check if all logical elements of two expressions are approximately equal.
|
| |
| template<typename Expr1 , typename Expr2 > |
| static FORCE_INLINE T | dot (const Expr1 &expr1, my_size_t base1, my_size_t stride1, const Expr2 &expr2, my_size_t base2, my_size_t stride2, my_size_t len) noexcept |
| | Dispatch dot product based on stride values.
|
| |
| template<typename Expr1 , typename Expr2 > |
| static FORCE_INLINE T | naive_dot_physical (const Expr1 &expr1, my_size_t base1, my_size_t stride1, const Expr2 &expr2, my_size_t base2, my_size_t stride2, my_size_t len) noexcept |
| | Naive scalar dot product for testing/validation.
|
| |
template<typename T ,
my_size_t Bits, typename Arch >
◆ dot()
template<typename T ,
my_size_t Bits, typename Arch >
template<typename Expr1 , typename Expr2 >
Dispatch dot product based on stride values.
◆ eval()
template<typename T ,
my_size_t Bits, typename Arch >
template<typename Expr >
Evaluation dispatch: pick contiguous or permuted eval based on expression layout.
◆ naive_dot_physical()
template<typename T ,
my_size_t Bits, typename Arch >
template<typename Expr1 , typename Expr2 >
Naive scalar dot product for testing/validation.
◆ reduce_all_approx_equal()
template<typename T ,
my_size_t Bits, typename Arch >
template<typename Expr1 , typename Expr2 >
| static FORCE_INLINE bool KernelOps< T, Bits, Arch >::reduce_all_approx_equal |
( |
const Expr1 & |
lhs, |
|
|
const Expr2 & |
rhs, |
|
|
T |
tolerance |
|
) |
| |
|
inline static noexcept |
Check if all logical elements of two expressions are approximately equal.
◆ reduce_max()
template<typename T ,
my_size_t Bits, typename Arch >
template<typename Expr >
◆ reduce_min()
template<typename T ,
my_size_t Bits, typename Arch >
template<typename Expr >
◆ reduce_sum()
template<typename T ,
my_size_t Bits, typename Arch >
template<typename Expr >
◆ simdWidth
template<typename T ,
my_size_t Bits, typename Arch >
The documentation for this struct was generated from the following file: