|
template<Elem E> |
constexpr auto | abs (const E &a) -> operand_base_type_t< E > |
| Compute the absolute value of a value.
|
|
template<Vector Vec> |
constexpr auto | abs (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Compute the absolute value for each element in the given vector.
|
|
template<ComplexElem E> |
constexpr auto | abs_square (const E &v) -> detail::utils::get_complex_component_type_t< operand_base_type_t< E > > |
| Compute the absolute square of a scalar complex value.
|
|
template<typename TR = int32, ComplexVector Vec>
requires (Utils::is_one_of_v<TR, int32, int16>) |
constexpr auto | abs_square (const Vec &v, int shift=0) |
| Compute the absolute square of each element in the given complex vector.
|
|
template<unsigned Elems>
requires (arch::is(arch::AIE) || (arch::is(arch::AIE_ML) && __AIE_API_COMPLEX_FP32_EMULATION__ == 1)) |
constexpr vector< float, Elems > | abs_square (const vector< cfloat, Elems > &v) |
| Compute the absolute square of each element in the given complex vector.
|
|
template<detail::NativeAccumType T> |
| accum (T) -> accum< typename detail::native_accum_traits< T >::value_type, detail::native_accum_traits< T >::elems > |
| Template deduction guidelines for aie::accum.
|
|
template<unsigned Lanes, AccumOrOp Acc, Vector VecCoeff, Vector VecData, Vector... NextVecData>
requires ((is_same_vector_v<VecData, NextVecData> && ...) && Acc::size() == Lanes && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | accumulate (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, const NextVecData &...next_data) -> operand_base_type_t< Acc > |
| Performs a weighted addition over multiple vectors and accumulates the result into an existing accumulator.
|
|
template<unsigned Lanes, unsigned CoeffStart = 0, AccumElemBaseType AccumTag = accauto, Vector VecCoeff, Vector VecData, Vector... NextVecData> |
auto | accumulate (const VecCoeff &coeff, const VecData &data, const NextVecData &...next_data) |
|
template<unsigned Lanes, AccumElemBaseType AccumTag = accauto, Vector VecCoeff, Vector VecData, Vector... NextVecData>
requires ((is_same_vector_v<VecData, NextVecData> && ...)) |
auto | accumulate (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, const NextVecData &...next_data) -> accum< detail::accum_tag_or_default_t< AccumTag, typename VecCoeff::value_type, typename VecData::value_type >, Lanes > |
| Performs a weighted addition over multiple vectors.
|
|
template<AccumOrOp Acc, Vector Vec>
requires (Acc::size() == Vec::size()) |
auto | add (const Acc &acc, const Vec &v) -> result_type_t< Acc > |
| Returns an accumulator with the element-wise addition of the input accumulator and vector.
|
|
template<AccumOrOp Acc, Elem E> |
auto | add (const Acc &acc, E a) -> result_type_t< Acc > |
| Returns an accumulator with the addition of a value to all the elements of the input vector.
|
|
template<AccumOrOp Acc1, AccumOrOp Acc2>
requires (arch::is(arch::AIE_ML) && is_same_accum_v<result_type_t<Acc1>, result_type_t<Acc2>>) |
auto | add (const Acc1 &acc1, const Acc2 &acc2) -> result_type_t< Acc1 > |
| Returns an accumulator with the element-wise addition of the two input accumulators.
|
|
template<Vector Vec, Elem E>
requires (is_valid_elem_op_v<typename Vec::value_type, E>) |
auto | add (const Vec &v, E a) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with the addition of a value to all the elements of the input vector.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | add (const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Vec1 > |
| Returns a vector with the element-wise addition of the two input vectors.
|
|
template<Elem E, Vector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | add (E a, const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with the addition of a value to all the elements of the input vector.
|
|
template<typename T >
requires (detail::is_floating_point_v<T>) |
T | add (T a, T b) |
|
template<Vector Vec> |
Vec::value_type | add_reduce (const Vec &v) |
|
template<Vector Vec, Vector... Others> |
auto | add_reduce_v (const Vec &v, const Others &... others) -> aie_dm_resource_remove_t< Vec > |
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin (adf::io_buffer< T, Dir, Config > &port) |
| Returns a foward iterator over given io buffer.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a foward const iterator over given io buffer.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin (T *base, size_t n) |
| Returns an iterator for the array described by the given address and size.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , unsigned Elems> |
constexpr auto | begin (T(&base)[Elems]) |
| Returns an iterator for the given statically-sized array.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_circular (adf::io_buffer< T, Dir, Config > &port) |
| Returns a foward circular iterator over given io buffer.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_circular (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const foward circular iterator over given io buffer.
|
|
template<size_t Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin_circular (T *base) |
| Returns a circular iterator for the array described by the given address and size.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin_circular (T *base, size_t n) |
| Returns a circular iterator for the array described by the given address and size.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , size_t Elems> |
constexpr auto | begin_circular (T(&base)[Elems]) |
| Returns a circular iterator for the given statically-sized array.
|
|
template<unsigned Steps, typename T , typename... Offsets> |
constexpr auto | begin_pattern (T *base, Offsets &&... offsets) |
| Returns a forward iterator for the array described by the given address.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_random_circular (adf::io_buffer< T, Dir, Config > &port) |
| Returns a random iterator over given io buffer.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_random_circular (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a random const iterator over given io buffer.
|
|
template<size_t Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin_random_circular (T *base) |
| Returns a random-access circular iterator for the array described by the given address and size.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin_random_circular (T *base, size_t n) |
| Returns a random-access circular iterator for the array described by the given address and size.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , size_t Elems> |
constexpr auto | begin_random_circular (T(&base)[Elems]) |
| Returns a random-access circular iterator for the array described by the given address and size.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_restrict_vector (adf::io_buffer< T, Dir, Config > &port) |
| Returns a restrict vector iterator over given io buffer.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_restrict_vector (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const restrict vector iterator over given io buffer.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
constexpr auto | begin_restrict_vector (const T *base) |
| Same as begin_vector, but the given pointer is considered restrict.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
constexpr auto | begin_restrict_vector (T *base) |
| Same as begin_vector, but the given pointer is considered restrict.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
constexpr auto | begin_unaligned_vector (T *base) |
| Returns a vector iterator starting at the given address.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_vector (adf::io_buffer< T, Dir, Config > &port) |
| Returns a vector iterator over given io buffer.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_vector (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const vector iterator over given io buffer.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
constexpr auto | begin_vector (const T *base) |
| Returns a vector iterator starting at the given address.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
constexpr auto | begin_vector (T *base) |
| Returns a vector iterator starting at the given address.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_vector_circular (adf::io_buffer< T, Dir, Config > &port) |
| Returns a vector circular iterator over given io buffer.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_vector_circular (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const vector circular iterator over given io buffer.
|
|
template<unsigned Elems, size_t ArrayElems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin_vector_circular (T *base) |
| Returns a circular iterator for the array described by the given address and size.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin_vector_circular (T *base, size_t n) |
| Returns a circular iterator for the array described by the given address and size.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , size_t ArrayElems> |
constexpr auto | begin_vector_circular (T(&base)[ArrayElems]) |
| Returns a circular iterator for the array described by the given address and size.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_vector_random_circular (adf::io_buffer< T, Dir, Config > &port) |
| Returns a vector random circular iterator over given io buffer.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | begin_vector_random_circular (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const vector random circular iterator over given io buffer.
|
|
template<unsigned Elems, size_t ArrayElems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin_vector_random_circular (T *base) |
| Returns a circular iterator for the array described by the given address and size.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | begin_vector_random_circular (T *base, size_t n) |
| Returns a circular iterator for the array described by the given address and size.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , size_t ArrayElems> |
constexpr auto | begin_vector_random_circular (T(&base)[ArrayElems]) |
| Returns a circular iterator for the array described by the given address and size.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType... Types> |
constexpr auto | begin_vectors (Types *...ptrs) |
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2> && (!detail::is_complex_v<typename Vec1::value_type>) && (!detail::is_floating_point_v<typename Vec1::value_type>)) |
auto | bit_and (const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Vec1 > |
| Returns a vector with the bit-wise AND of the elements of the two input vectors.
|
|
template<Elem E, Vector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type> && (!detail::is_complex_v<typename Vec::value_type>) && (!detail::is_floating_point_v<typename Vec::value_type>)) |
auto | bit_and (E a, const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with the bit-wise AND of a value and all the elements of the input vector.
|
|
template<Vector Vec>
requires ((!detail::is_complex_v<typename Vec::value_type>) && (!detail::is_floating_point_v<typename Vec::value_type>)) |
auto | bit_not (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with the bit-wise NEG of the elements of the input vector.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2> && (!detail::is_complex_v<typename Vec1::value_type>) && (!detail::is_floating_point_v<typename Vec1::value_type>)) |
auto | bit_or (const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Vec1 > |
| Returns a vector with the bit-wise OR of the elements of the two input vectors.
|
|
template<Elem E, Vector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type> && (!detail::is_complex_v<typename Vec::value_type>) && (!detail::is_floating_point_v<typename Vec::value_type>)) |
auto | bit_or (E a, const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with the bit-wise OR of a value and all the elements of the input vector.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2> && (!detail::is_complex_v<typename Vec1::value_type>) && (!detail::is_floating_point_v<typename Vec1::value_type>)) |
auto | bit_xor (const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Vec1 > |
| Returns a vector with the bit-wise XOR of the elements of the two input vectors.
|
|
template<Elem E, Vector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type> && (!detail::is_complex_v<typename Vec::value_type>) && (!detail::is_floating_point_v<typename Vec::value_type>)) |
auto | bit_xor (E a, const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with the bit-wise XOR of a value and all the elements of the input vector.
|
|
template<Elem E, unsigned Elems = native_vector_length_v<E>> |
vector< operand_base_type_t< E >, Elems > | broadcast (E a) |
| Returns a vector whose elements are initialized to the given value.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | cbegin (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a foward const iterator over given io buffer.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | cbegin (const T *base, size_t n) |
| Returns an iterator for the constant array described by the given address and size.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | cbegin_circular (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const foward iterator over given io buffer.
|
|
template<size_t Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr const_circular_iterator< T, Elems, Resource > | cbegin_circular (const T *base) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr const_circular_iterator< T, dynamic_extent, Resource > | cbegin_circular (const T *base, size_t n) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , size_t Elems> |
constexpr const_circular_iterator< T, Elems, Resource > | cbegin_circular (const T(&base)[Elems]) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<unsigned Steps, typename T , typename... Offsets> |
constexpr const_pattern_iterator< T, Steps > | cbegin_pattern (const T *base, Offsets &&... offsets) |
| Similar to begin_pattern, but the returned iterator is constant.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | cbegin_random_circular (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a random const iterator over given io buffer.
|
|
template<size_t Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | cbegin_random_circular (const T *base) |
| Similar to begin_random_circular, but the returned iterator is constant.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | cbegin_random_circular (const T *base, size_t n) |
| Similar to begin_random_circular, but the returned iterator is constant.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , size_t Elems> |
constexpr auto | cbegin_random_circular (const T(&base)[Elems]) |
| Similar to begin_random_circular, but the returned iterator is constant.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | cbegin_restrict_vector (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const restrict vector iterator over given io buffer.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
constexpr auto | cbegin_restrict_vector (const T *base) |
| Same as begin_vector, but the given pointer is considered restrict.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
constexpr auto | cbegin_unaligned_vector (T *base) |
| Returns a vector iterator starting at the given address.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | cbegin_vector (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const vector iterator over given io buffer.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
constexpr auto | cbegin_vector (const T *base) |
| Same as begin_vector.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | cbegin_vector_circular (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const vector circular iterator over given io buffer.
|
|
template<unsigned Elems, size_t ArrayElems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | cbegin_vector_circular (const T *base) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | cbegin_vector_circular (const T *base, size_t n) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , size_t ArrayElems> |
constexpr auto | cbegin_vector_circular (const T(&base)[ArrayElems]) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , typename Dir , typename Config > |
constexpr auto | cbegin_vector_random_circular (const adf::io_buffer< T, Dir, Config > &port) |
| Returns a const vector random circular iterator over given io buffer.
|
|
template<unsigned Elems, size_t ArrayElems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | cbegin_vector_random_circular (const T *base) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | cbegin_vector_random_circular (const T *base, size_t n) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, typename T , size_t ArrayElems> |
constexpr auto | cbegin_vector_random_circular (const T(&base)[ArrayElems]) |
| Similar to begin_circular, but the returned iterator is constant.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType... Types> |
constexpr auto | cbegin_vectors (const Types *...ptrs) |
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | cend (const T *base, size_t n) |
| Returns an iterator that points at the end of the constant array described by the given address and size.
|
|
template<Accum Acc, Accum... Accums>
requires ((is_same_accum_v<Acc, Accums> && ...)) |
auto | concat (const Acc &acc, const Accums &...accums) -> accum< typename Acc::value_type, Acc::size() *(1+sizeof...(Accums))> |
| Concatenate the contents of all input accumulators into a larger accumulator.
|
|
template<Vector Vec, Vector... Vectors>
requires ((is_same_vector_v<Vec, Vectors> && ...)) |
auto | concat (const Vec &v, const Vectors &...vectors) -> vector< typename Vec::value_type, Vec::size() *(1+sizeof...(Vectors))> |
| Concatenate the contents of all input vectors into a larger vector.
|
|
template<ComplexElem E> |
constexpr auto | conj (const E &a) -> operand_base_type_t< E > |
| Compute the conjugate in the given complex value.
|
|
template<ComplexVector Vec> |
auto | conj (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Compute the conjugate for each element in the given vector of complex elements.
|
|
template<Elem E, Vector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
bool | contains (E a, const Vec &v) |
|
template<RealVector Vec>
requires (arch::is(arch::AIE)) |
auto | cos (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Performs a cosine operation on all elements in the input vector.
|
|
template<typename E >
requires (arch::is(arch::AIE) && (RealElem<E> || std::is_integral_v<E>)) |
auto | cos (E a) |
| Performs a cosine operation on a single value.
|
|
template<ComplexVector Vec, ComplexElem E>
requires (arch::is(arch::AIE) || (arch::is(arch::AIE_ML) && __AIE_API_COMPLEX_FP32_EMULATION__ == 1)) |
auto | div (const Vec &a, const E &b) -> accum< detail::accum_tag_for_mul_types< typename Vec::value_type, detail::utils::get_complex_component_type_t< E > >, Vec::size()> |
| Returns the quotients of the element-wise division of a complex vector 'a' by a complex scalar 'b'.
|
|
template<ComplexVector Vec>
requires (arch::is(arch::AIE) || (arch::is(arch::AIE_ML) && __AIE_API_COMPLEX_FP32_EMULATION__ == 1)) |
auto | div (const Vec &a, const Vec &b) -> accum< detail::accum_tag_for_mul_types< typename Vec::value_type, detail::utils::get_complex_component_type_t< typename Vec::value_type > >, Vec::size()> |
| Returns the quotients of the element-wise division of two complex vectors 'a' and 'b'.
|
|
template<Vector Vec, RealElem E>
requires ( detail::is_floating_point_v<typename Vec::value_type> && detail::is_valid_element_type_v<E> && detail::is_floating_point_v<E>) |
auto | div (const Vec &a, E b) -> accum< detail::accum_tag_for_mul_types< typename Vec::value_type, E >, Vec::size()> |
| Returns the quotients of the element-wise division of each value of the first input vector by a scalar.
|
|
template<Vector Vec1, RealVector Vec2>
requires (Vec1::size() == Vec2::size() && detail::is_floating_point_v<typename Vec2::value_type>) |
auto | div (const Vec1 &a, const Vec2 &b) -> accum< detail::accum_tag_for_mul_types< typename Vec1::value_type, typename Vec2::value_type >, Vec1::size()> |
| Returns the quotients of the element-wise division of each value of the first input vector by the corresponding element in the second input vector.
|
|
float | div (float a, float b) |
|
template<Vector Vec> |
constexpr auto | downshift (const Vec &v, unsigned shift) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with all values arithmetically downshifted by specified number of bits.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T > |
constexpr auto | end (T *base, size_t n) |
| Returns an iterator that points at the end of the array described by the given address and size.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , unsigned Elems> |
constexpr auto | end (T(&base)[Elems]) |
| Returns an iterator that points at the end of the given statically-sized array.
|
|
template<Vector Vec, Elem E>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | eq (const Vec &v, E a) |
| Compares a value with the elements of the input vector and returns a mask that says what elements in the vector are equal to the value.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
mask< Vec1::size()> | eq (const Vec1 &v1, const Vec2 &v2) |
| Compares the elements of the two input vectors and returns a mask that says what elements are equal.
|
|
template<Elem E, Vector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | eq (E a, const Vec &v) |
| Compares a value with the elements of the input vector and returns a mask that says what elements in the vector are equal to the value.
|
|
template<typename T >
requires (detail::is_floating_point_v<T>) |
bool | eq (T a, T b) |
| Compares the two input values and returns whether they are equal.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
constexpr bool | equal (const Vec1 &v1, const Vec2 &v2) |
| Return whether all the elements of the two input vectors are equal.
|
|
template<unsigned Vectorization, typename Input , typename Output , typename Twiddle >
requires (arch::is(arch::AIE) && detail::is_floating_point_v<Input>) |
void | fft_dit_r2_stage (const Input *__restrict x, const Twiddle *__restrict tw, unsigned n, bool inv, Output *__restrict out) |
| A function to perform a single floating point radix 2 FFT stage.
|
|
template<unsigned Vectorization, typename Input , typename Output , typename Twiddle > |
void | fft_dit_r2_stage (const Input *__restrict x, const Twiddle *__restrict tw, unsigned n, unsigned shift_tw, unsigned shift, bool inv, Output *__restrict out) |
| A function to perform a single radix 2 FFT stage.
|
|
template<unsigned Vectorization, typename Input , typename Output , typename Twiddle >
requires (arch::is(arch::AIE)) |
void | fft_dit_r3_stage (const Input *__restrict x, const Twiddle *__restrict tw0, const Twiddle *__restrict tw1, unsigned n, unsigned shift_tw, unsigned shift, bool inv, Output *__restrict out) |
| A function to perform a single radix 3 FFT stage.
|
|
template<unsigned Vectorization, typename Input , typename Output , typename Twiddle > |
void | fft_dit_r4_stage (const Input *__restrict x, const Twiddle *__restrict tw0, const Twiddle *__restrict tw1, const Twiddle *__restrict tw2, unsigned n, unsigned shift_tw, unsigned shift, bool inv, Output *__restrict out) |
| A function to perform a single radix 4 FFT stage.
|
|
template<unsigned Vectorization, typename Input , typename Output , typename Twiddle >
requires (arch::is(arch::AIE)) |
void | fft_dit_r5_stage (const Input *__restrict x, const Twiddle *__restrict tw0, const Twiddle *__restrict tw1, const Twiddle *__restrict tw2, const Twiddle *__restrict tw3, unsigned n, unsigned shift_tw, unsigned shift, bool inv, Output *out) |
| A function to perform a single radix 5 FFT stage.
|
|
template<Vector Vec> |
auto | filter_even (const Vec &v, unsigned step=1) -> vector< typename Vec::value_type, Vec::size()/2 > |
| Returns a vector of half the size whose contents follow the following pattern.
|
|
template<Vector Vec> |
auto | filter_odd (const Vec &v, unsigned step=1) -> vector< typename Vec::value_type, Vec::size()/2 > |
| Returns a vector of half the size whose contents follow the following pattern.
|
|
template<AccumElemBaseType AccumTag, VectorOrOp Vec> |
accum< AccumTag, Vec::size()> | from_vector (const Vec &v, int shift=0) |
| Returns the values of the passed vector in an accumulator of the requested type after applying the requested upshift operation.
|
|
template<RealVector Vec, RealElem E>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | ge (const Vec &v, E a) |
| Compares the elements of the input vector with a value and returns a mask that says if the elements in the vector are greater or equal than the value.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
mask< Vec1::size()> | ge (const Vec1 &v1, const Vec2 &v2) |
| Compares the elements of the two input vectors and returns a mask that says what elements from the first vector are greater or equal than the corresponding elements in the second vector.
|
|
template<RealElem E, RealVector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | ge (E a, const Vec &v) |
| Compares a value with the elements of the input vector and returns a mask that says if the value is greater or equal than the elements in the vector.
|
|
template<typename T >
requires (detail::is_floating_point_v<T> && !detail::is_complex_v<T>) |
bool | ge (T a, T b) |
| Compares the two input values and returns whether the first value is larger or equal than the second value.
|
|
template<RealVector Vec, RealElem E>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | gt (const Vec &v, E a) |
| Compares the elements of the input vector with a value and returns a mask that says if the elements in the vector are greater than the value.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
mask< Vec1::size()> | gt (const Vec1 &v1, const Vec2 &v2) |
| Compares the elements of the two input vectors and returns a mask that says what elements from the first vector are greater than the corresponding elements in the second vector.
|
|
template<RealElem E, RealVector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | gt (E a, const Vec &v) |
| Compares a value with the elements of the input vector and returns a mask that says if the value is greater than the elements in the vector.
|
|
template<typename T >
requires (detail::is_floating_point_v<T> && !detail::is_complex_v<T>) |
bool | gt (T a, T b) |
| Compares the two input values and returns whether the first value is larger than the second value.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | interleave_butterfly (const Vec1 &v1, const Vec2 &v2, unsigned step) -> std::pair< aie_dm_resource_remove_t< Vec1 >, aie_dm_resource_remove_t< Vec1 > > |
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | interleave_butterfly_half (const Vec1 &v1, const Vec2 &v2, unsigned step) -> std::pair< aie_dm_resource_remove_t< Vec1 >, aie_dm_resource_remove_t< Vec1 > > |
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | interleave_crossover (const Vec1 &v1, const Vec2 &v2, unsigned step) -> std::pair< aie_dm_resource_remove_t< Vec1 >, aie_dm_resource_remove_t< Vec1 > > |
|
template<Vector Vec1, Vector Vec2, typename... Select>
requires (is_same_vector_v<Vec1, Vec2> && sizeof...(Select) == Vec1::size()) |
auto | interleave_custom (const Vec1 &v1, const Vec2 &v2, Select... select) -> std::pair< aie_dm_resource_remove_t< Vec1 >, aie_dm_resource_remove_t< Vec1 > > |
|
template<unsigned S0, unsigned S1, unsigned S2, unsigned S3, unsigned S4, unsigned S5, unsigned S6, unsigned S7, unsigned S8, unsigned S9, unsigned S10, unsigned S11, unsigned S12, unsigned S13, unsigned S14, unsigned S15, unsigned S16, unsigned S17, unsigned S18, unsigned S19, unsigned S20, unsigned S21, unsigned S22, unsigned S23, unsigned S24, unsigned S25, unsigned S26, unsigned S27, unsigned S28, unsigned S29, unsigned S30, unsigned S31, Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | interleave_custom_static (const Vec1 &v1, const Vec2 &v2) -> std::pair< aie_dm_resource_remove_t< Vec1 >, aie_dm_resource_remove_t< Vec1 > > |
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | interleave_unzip (const Vec1 &v1, const Vec2 &v2, unsigned step) -> std::pair< aie_dm_resource_remove_t< Vec1 >, aie_dm_resource_remove_t< Vec1 > > |
| Picks elements sequentially from the input vectors and writes them alternatively into the output vectors.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | interleave_zip (const Vec1 &v1, const Vec2 &v2, unsigned step) -> std::pair< aie_dm_resource_remove_t< Vec1 >, aie_dm_resource_remove_t< Vec1 > > |
| Picks elements alternatively from the input vectors and writes them sequentially into the output vectors.
|
|
template<unsigned Elems>
requires (arch::is(arch::AIE)) |
accum< accfloat, Elems > | inv (const accum< accfloat, Elems > &v) |
|
template<Vector Vec> |
auto | inv (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
|
template<RealElem E> |
auto | inv (E a) |
|
template<unsigned Elems>
requires (arch::is(arch::AIE)) |
accum< accfloat, Elems > | invsqrt (const accum< accfloat, Elems > &v) |
|
template<Vector Vec> |
auto | invsqrt (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
|
template<Elem E> |
auto | invsqrt (E a) |
|
template<typename T , Elem E> |
constexpr bool | is_ct_elem_zero (E a) |
|
template<RealVector Vec, RealElem E>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | le (const Vec &v, E a) |
| Compares the elements of the input vector with a value and returns a mask that says if the elements in the vector are smaller or equal than the value.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
mask< Vec1::size()> | le (const Vec1 &v1, const Vec2 &v2) |
| Compares the elements of the two input vectors and returns a mask that says what elements from the first vector are smaller or equal than the corresponding elements in the second vector.
|
|
template<RealElem E, RealVector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | le (E a, const Vec &v) |
| Compares a value with the elements of the input vector and returns a mask that says if the value is smaller or equal than the elements in the vector.
|
|
template<typename T >
requires (detail::is_floating_point_v<T> && !detail::is_complex_v<T>) |
bool | le (T a, T b) |
| Compares the two input values and returns whether the first value is smaller or equal than the second value.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | load_floor_bytes_v (const T *ptr, size_t bytes) -> vector< aie_dm_resource_remove_t< T >, Elems > |
| Load a vector of Elems size whose elements have type T.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | load_floor_v (const T *ptr, unsigned n=Elems) -> vector< aie_dm_resource_remove_t< T >, Elems > |
| Load a vector of Elems size whose elements have type T.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | load_unaligned_v (const T *ptr, unsigned aligned_elems=1) -> vector< aie_dm_resource_remove_t< T >, Elems > |
| Load a vector of Elems size whose elements have type T.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | load_unaligned_v (const T *ptr, unsigned aligned_elems=1) -> vector< aie_dm_resource_remove_t< T >, native_vector_length_v< T > > |
| Load a vector whose elements have type T.
|
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | load_v (const T *ptr) -> vector< aie_dm_resource_remove_t< T >, Elems > |
| Load a vector of Elems size whose elements have type T.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | load_v (const T *ptr) -> vector< aie_dm_resource_remove_t< T >, native_vector_length_v< T > > |
| Load a vector whose elements have type T.
|
|
template<Vector Vec> |
constexpr auto | logical_downshift (const Vec &v, unsigned shift) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with all values logically downshifted by specified number of bits.
|
|
template<RealVector Vec, RealElem E>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | lt (const Vec &v, E a) |
| Compares the elements of the input vector with a value and returns a mask that says if the elements in the vector are smaller than the value.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
mask< Vec1::size()> | lt (const Vec1 &v1, const Vec2 &v2) |
| Compares the elements of the two input vectors and returns a mask that says what elements from the first vector are smaller than the corresponding elements in the second vector.
|
|
template<RealElem E, RealVector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | lt (E a, const Vec &v) |
| Compares a value with the elements of the input vector and returns a mask that says if the value is smaller than the elements in the vector.
|
|
template<typename T >
requires (detail::is_floating_point_v<T> && !detail::is_complex_v<T>) |
bool | lt (T a, T b) |
| Compares the two input values and returns whether the first value is smaller than the second value.
|
|
template<AccumOrOp Acc, VectorOrOp Vec, ElemOrOp E>
requires (is_valid_size_v<Acc, Vec, E> && is_valid_mul_op_v<typename Vec::value_type, E>) |
constexpr auto | mac (const Acc &acc, const Vec &v, E a) -> operand_base_type_t< Acc > |
| Returns an accumulator with the element-wise multiply-add of input vector, value and accumulator.
|
|
template<AccumOrOp Acc, VectorOrOp Vec1, VectorOrOp Vec2>
requires (is_valid_size_v<Acc, Vec1, Vec2> && is_valid_mul_op_v<typename Vec1::value_type, typename Vec2::value_type>) |
constexpr auto | mac (const Acc &acc, const Vec1 &v1, const Vec2 &v2) -> operand_base_type_t< Acc > |
| Returns an accumulator with the element-wise multiply-add of the two input vectors and accumulator.
|
|
template<AccumOrOp Acc, ElemOrOp E, VectorOrOp Vec>
requires (is_valid_size_v<Acc, E, Vec> && is_valid_mul_op_v<E, typename Vec::value_type>) |
constexpr auto | mac (const Acc &acc, E a, const Vec &v) -> operand_base_type_t< Acc > |
| Returns an accumulator with the element-wise multiply-add of value, input vector and accumulator.
|
|
template<typename TR , typename T1 , typename T2 >
requires (detail::is_floating_point_v<T1> && detail::is_floating_point_v<T2> && std::is_same_v<decltype(mul(a, b)), TR>) |
TR | mac (TR c, T1 a, T2 b) |
|
template<AccumOrOp Acc, Vector Vec>
requires (Vec::size() == Acc::size()) |
constexpr auto | mac_square (const Acc &acc, const Vec &v) |
| Returns an accumulator with the addition or subtraction of the given accumulator and the element-wise square of the input vector.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename TensorDescriptor > |
constexpr auto | make_restrict_tensor_buffer_stream (T *__restrict base, const TensorDescriptor &tensor_desc) |
|
template<aie_dm_resource Resource = aie_dm_resource::none, typename T , typename TensorDescriptor > |
constexpr auto | make_tensor_buffer_stream (T *base, const TensorDescriptor &tensor_desc) |
|
template<typename T , unsigned Elems, typename... Args>
requires (arch::is(arch::AIE_ML) && (std::is_same_v<Args, tensor_dim> && ...)) |
constexpr auto | make_tensor_descriptor (Args &&... args) |
|
template<typename T , unsigned Elems, typename... Args>
requires (arch::is(arch::AIE_ML) && (std::is_same_v<Args, tensor_dim> && ...)) |
constexpr auto | make_tensor_descriptor_bytes (Args &&... args) |
|
template<typename T , unsigned Elems, typename... Args> |
constexpr auto | make_tensor_descriptor_from_native (Args &&... args) |
|
template<typename T , unsigned Elems, typename... Args> |
constexpr auto | make_tensor_descriptor_from_native_bytes (Args &&... args) |
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | make_unaligned_vector_input_buffer_stream (const T *ptr) -> unaligned_vector_input_buffer_stream< T, Elems, Resource > |
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | make_unaligned_vector_output_buffer_stream (T *ptr) -> unaligned_vector_output_buffer_stream< T, Elems, Resource > |
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | make_vector_input_buffer_stream (const T *ptr) -> vector_input_buffer_stream< T, Elems, Resource > |
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T> |
auto | make_vector_output_buffer_stream (T *ptr) -> vector_output_buffer_stream< T, Elems, Resource > |
|
template<RealVector Vec, RealElem E>
requires (is_valid_elem_op_v<typename Vec::value_type, E>) |
auto | max (const Vec &v, E a) -> aie_dm_resource_remove_t< Vec > |
| Compares the elements of the input vector with a value and returns a vector with the maximum values.
|
|
template<RealVector Vec, RealElem E>
requires (arch::is(arch::AIE_ML) && is_valid_elem_op_v<typename Vec::value_type, E>) |
auto | max (const Vec &v, E a, bool sign) -> aie_dm_resource_remove_t< Vec > |
| Compares the elements of the input vector with a value and returns a vector with the maximum values.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | max (const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Vec1 > |
| Compares the elements of the two input vectors and returns a vector with the maximum values.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (arch::is(arch::AIE_ML) && is_same_vector_v<Vec1, Vec2>) |
auto | max (const Vec1 &v1, const Vec2 &v2, bool sign) -> aie_dm_resource_remove_t< Vec1 > |
| Compares the elements of the two input vectors and returns a vector with the maximum values.
|
|
template<RealElem E, RealVector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | max (E a, const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Compares a value with the elements of the input vector and returns a vector with the maximum values.
|
|
template<RealElem E, RealVector Vec>
requires (arch::is(arch::AIE_ML) && is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | max (E a, const Vec &v, bool sign) -> aie_dm_resource_remove_t< Vec > |
| Compares a value with the elements of the input vector and returns a vector with the maximum values.
|
|
template<typename T >
requires (detail::is_floating_point_v<T>) |
T | max (T a, T b) |
| Compares the two input values and returns the maximum value.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | max_cmp (const Vec1 &v1, const Vec2 &v2) -> std::tuple< aie_dm_resource_remove_t< Vec1 >, mask< Vec1::size()> > |
|
template<RealVector Vec> |
Vec::value_type | max_reduce (const Vec &v) |
|
template<RealVector Vec, RealElem E>
requires (is_valid_elem_op_v<typename Vec::value_type, E>) |
auto | maxdiff (const Vec &v, E a) -> aie_dm_resource_remove_t< Vec > |
| Compares the elements of the input vector with a value and returns a vector whose values are their difference if it is positive, or zero otherwise.
|
|
template<RealVector Vec, RealElem E>
requires (arch::is(arch::AIE_ML) && is_valid_elem_op_v<typename Vec::value_type, E>) |
auto | maxdiff (const Vec &v, E a, bool sign) -> aie_dm_resource_remove_t< Vec > |
| Compares the elements of the input vector with a value and returns a vector whose values are their difference if it is positive, or zero otherwise.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | maxdiff (const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Vec1 > |
| Compares the elements of the two input vectors and returns a vector whose values are their difference if it is positive, or zero otherwise.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (arch::is(arch::AIE_ML) && is_same_vector_v<Vec1, Vec2>) |
auto | maxdiff (const Vec1 &v1, const Vec2 &v2, bool sign) -> aie_dm_resource_remove_t< Vec1 > |
| Compares the elements of the two input vectors and returns a vector whose values are their difference if it is positive, or zero otherwise.
|
|
template<RealElem E, RealVector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | maxdiff (E a, const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Compares a value with the elements of the input vector and returns a vector whose values are their difference if it is positive, or zero otherwise.
|
|
template<RealElem E, RealVector Vec>
requires (arch::is(arch::AIE_ML) && is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | maxdiff (E a, const Vec &v, bool sign) -> aie_dm_resource_remove_t< Vec > |
| Compares a value with the elements of the input vector and returns a vector whose values are their difference if it is positive, or zero otherwise.
|
|
template<RealVector Vec, RealElem E>
requires (is_valid_elem_op_v<typename Vec::value_type, E>) |
auto | min (const Vec &v, E a) -> aie_dm_resource_remove_t< Vec > |
| Compares the elements of the input vector with a value and returns a vector with the minimum values.
|
|
template<RealVector Vec, RealElem E>
requires (arch::is(arch::AIE_ML) && is_valid_elem_op_v<typename Vec::value_type, E>) |
auto | min (const Vec &v, E a, bool sign) -> aie_dm_resource_remove_t< Vec > |
| Compares the elements of the input vector with a value and returns a vector with the minimum values.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | min (const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Vec1 > |
| Compares the elements of the two input vectors and returns a vector with the minimum values.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (arch::is(arch::AIE_ML) && is_same_vector_v<Vec1, Vec2>) |
auto | min (const Vec1 &v1, const Vec2 &v2, bool sign) -> aie_dm_resource_remove_t< Vec1 > |
| Compares the elements of the two input vectors and returns a vector with the minimum values.
|
|
template<RealElem E, RealVector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | min (E a, const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Compares a value with the elements of the input vector and returns a vector with the minimum values.
|
|
template<RealElem E, RealVector Vec>
requires (arch::is(arch::AIE_ML) && is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | min (E a, const Vec &v, bool sign) -> aie_dm_resource_remove_t< Vec > |
| Compares a value with the elements of the input vector and returns a vector with the minimum values.
|
|
template<typename T >
requires (detail::is_floating_point_v<T>) |
T | min (T a, T b) |
| Compares the two input values and returns the minimum value.
|
|
template<RealVector Vec1, RealVector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | min_cmp (const Vec1 &v1, const Vec2 &v2) -> std::tuple< aie_dm_resource_remove_t< Vec1 >, mask< Vec1::size()> > |
|
template<RealVector Vec> |
Vec::value_type | min_reduce (const Vec &v) |
|
template<unsigned M, unsigned K, unsigned N, typename Acc , Vector VecA, Vector VecB>
requires ((Acc::accum_type::size() == M * N) && (VecA::size() == M * K) && (VecB::size() == K * N) && is_valid_mul_op_v<typename VecA::value_type, typename VecB::value_type> && is_mmul_v<Acc>) |
auto | mmac_fn (Acc &c, const VecA &a, const VecB &b) |
|
template<unsigned M, unsigned K, unsigned N, Accum Acc, Vector VecA, Vector VecB>
requires ((Acc::size() == M * N) && (VecA::size() == M * K) && (VecB::size() == K * N) && is_valid_mul_op_v<typename VecA::value_type, typename VecB::value_type>) |
auto | mmac_fn (const Acc &c, const VecA &a, const VecB &b) |
|
template<unsigned M, unsigned K, unsigned N, AccumElemBaseType AccumTag = accauto, Vector VecA, Vector VecB>
requires ((VecA::size() == M * K) && (VecB::size() == K * N) && is_valid_mul_op_v<typename VecA::value_type, typename VecB::value_type>) |
auto | mmul_fn (const VecA &a, const VecB &b) |
|
template<Accum Acc, VectorOrOp Vec, ElemOrOp E>
requires (is_valid_size_v<Acc, Vec, E> && is_valid_mul_op_v<typename Vec::value_type, E>) |
constexpr auto | msc (const Acc &acc, const Vec &v, E a) -> aie_dm_resource_remove_t< Acc > |
| Returns an accumulator with the element-wise multiply-add of input vector, value and accumulator.
|
|
template<Accum Acc, VectorOrOp Vec1, VectorOrOp Vec2>
requires (is_valid_size_v<Acc, Vec1, Vec2> && is_valid_mul_op_v<typename Vec1::value_type, typename Vec2::value_type>) |
constexpr auto | msc (const Acc &acc, const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Acc > |
| Returns an accumulator with the element-wise multiply-add of the two input vectors and accumulator.
|
|
template<Accum Acc, ElemOrOp E, VectorOrOp Vec>
requires (is_valid_size_v<Acc, E, Vec> && is_valid_mul_op_v<E, typename Vec::value_type>) |
constexpr auto | msc (const Acc &acc, E a, const Vec &v) -> aie_dm_resource_remove_t< Acc > |
| Returns an accumulator with the element-wise multiply-add of value, input vector and accumulator.
|
|
template<typename TR , typename T1 , typename T2 >
requires (detail::is_floating_point_v<T1> && detail::is_floating_point_v<T2> && std::is_same_v<decltype(mul(a, b)), TR>) |
TR | msc (TR c, T1 a, T2 b) |
|
template<Accum Acc, Vector Vec>
requires (Vec::size() == Acc::size()) |
constexpr auto | msc_square (const Acc &acc, const Vec &v) |
| Returns an accumulator with the subtraction of the given accumulator and the element-wise square of the input vector.
|
|
template<VectorOrOp Vec, ElemOrOp E>
requires (is_valid_size_v<E, Vec> && is_valid_mul_op_v<typename Vec::value_type, E>) |
constexpr auto | mul (const Vec &v, E a) |
| Returns an accumulator with the element-wise multiplication of a value and all the elements of a vector.
|
|
template<AccumElemBaseType AccumTag, VectorOrOp Vec, ElemOrOp E>
requires (is_valid_size_v<Vec, E> && is_valid_mul_op_v<typename Vec::value_type, E>) |
constexpr auto | mul (const Vec &v, E a) -> accum< AccumTag, Vec::size()> |
| Returns an accumulator of the requested type with the element-wise multiplication of a value and all the elements of the input vector.
|
|
template<VectorOrOp Vec1, VectorOrOp Vec2>
requires (is_valid_size_v<Vec1, Vec2> && is_valid_mul_op_v<typename Vec1::value_type, typename Vec2::value_type>) |
constexpr auto | mul (const Vec1 &v1, const Vec2 &v2) |
| Returns an accumulator with the element-wise multiplication of the two input vectors.
|
|
template<AccumElemBaseType AccumTag, VectorOrOp Vec1, VectorOrOp Vec2>
requires (is_valid_size_v<Vec1, Vec2> && is_valid_mul_op_v<typename Vec1::value_type, typename Vec2::value_type>) |
constexpr auto | mul (const Vec1 &v1, const Vec2 &v2) -> accum< AccumTag, Vec1::size()> |
| Returns an accumulator of the requested type with the element-wise multiplication of the two input vectors.
|
|
template<ElemOrOp E, VectorOrOp Vec>
requires (is_valid_size_v<E, Vec> && is_valid_mul_op_v<E, typename Vec::value_type>) |
constexpr auto | mul (E a, const Vec &v) |
| Returns an accumulator with the element-wise multiplication of a value and all the elements of a vector.
|
|
template<AccumElemBaseType AccumTag, ElemOrOp E, VectorOrOp Vec>
requires (is_valid_size_v<Vec, E> && is_valid_mul_op_v<E, typename Vec::value_type>) |
constexpr auto | mul (E a, const Vec &v) -> accum< AccumTag, Vec::size()> |
| Returns an accumulator of the requested type with the element-wise multiplication of a value and all the elements of the input vector.
|
|
template<typename T1 , typename T2 >
requires (detail::is_floating_point_v<T1> && detail::is_floating_point_v<T2>) |
auto | mul (T1 a, T2 b) |
|
template<AccumElemBaseType AccumTag, Vector Vec> |
Vec::value_type | mul_reduce (const Vec &v) |
|
template<Vector Vec> |
constexpr Vec::value_type | mul_reduce (const Vec &v) |
|
template<Vector Vec> |
constexpr auto | mul_square (const Vec &v) |
| Returns an accumulator with the element-wise square of the input vector.
|
|
template<AccumElemBaseType AccumTag, Vector Vec> |
constexpr auto | mul_square (const Vec &v) -> accum< AccumTag, Vec::size()> |
| Returns an accumulator of the requested type with the element-wise square of the input vector.
|
|
template<Elem E> |
constexpr auto | neg (const E &a) -> operand_base_type_t< E > |
| For values with signed types, return the input value with the sign flipped.
|
|
template<Vector Vec> |
constexpr auto | neg (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| For vectors with signed types, return a vector whose elements are the same as in the given vector but with the sign flipped.
|
|
template<VectorOrOp Vec, ElemOrOp E>
requires (is_valid_mul_op_v<typename Vec::value_type, E>) |
constexpr auto | negmul (const Vec &v, E a) |
| Returns an accumulator with the negate of the element-wise multiplication of all the elements of the input vector and a value.
|
|
template<AccumElemBaseType AccumTag, VectorOrOp Vec, ElemOrOp E>
requires (is_valid_mul_op_v<typename Vec::value_type, E>) |
constexpr auto | negmul (const Vec &v, E a) -> accum< AccumTag, Vec::size()> |
| Returns an accumulator of the requested type with the negate of the element-wise multiplication of all the elements of the input vector and a value.
|
|
template<VectorOrOp Vec1, VectorOrOp Vec2>
requires ((Vec1::size() == Vec2::size()) && is_valid_mul_op_v<typename Vec1::value_type, typename Vec2::value_type>) |
constexpr auto | negmul (const Vec1 &v1, const Vec2 &v2) |
| Returns an accumulator with the negate of the element-wise multiplication of the two input vectors.
|
|
template<AccumElemBaseType AccumTag, VectorOrOp Vec1, VectorOrOp Vec2>
requires (Vec1::size() == Vec2::size() && is_valid_mul_op_v<typename Vec1::value_type, typename Vec2::value_type>) |
constexpr auto | negmul (const Vec1 &v1, const Vec2 &v2) -> accum< AccumTag, Vec1::size()> |
| Returns an accumulator of the requested type with the negate of the element-wise multiplication of the two input vectors.
|
|
template<ElemOrOp E, VectorOrOp Vec>
requires (is_valid_mul_op_v<E, typename Vec::value_type>) |
constexpr auto | negmul (E a, const Vec &v) |
| Returns an accumulator with the negate of the element-wise multiplication of a value and all the elements of the input vector.
|
|
template<AccumElemBaseType AccumTag, ElemOrOp E, VectorOrOp Vec>
requires (is_valid_mul_op_v<E, typename Vec::value_type>) |
constexpr auto | negmul (E a, const Vec &v) -> accum< AccumTag, Vec::size()> |
| Returns an accumulator of the requested type with the negate of the element-wise multiplication of a value and all the elements of the input vector.
|
|
template<Vector Vec, Elem E>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | neq (const Vec &v, E a) |
| Compares a value with the elements of the input vector and returns a mask that says what elements in the vector are different than the value.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
mask< Vec1::size()> | neq (const Vec1 &v1, const Vec2 &v2) |
| Compares the elements of the two input vectors and returns a mask that says what elements are different.
|
|
template<Elem E, Vector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
mask< Vec::size()> | neq (E a, const Vec &v) |
| Compares a value with the elements of the input vector and returns a mask that says what elements in the vector are different than the value.
|
|
template<typename T >
requires (detail::is_floating_point_v<T>) |
bool | neq (T a, T b) |
| Compares the two input values and returns whether they are not equal.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
constexpr bool | not_equal (const Vec1 &v1, const Vec2 &v2) |
| Return whether some elements in the two input vectors are not equal.
|
|
template<typename T >
requires (RealVector<T> || RealElem<T> || is_real_op_v<T>) |
constexpr unary_op< T, Operation::Abs > | op_abs (const T &e) |
| Returns an absolute operation modifier for the given vector or element.
|
|
template<Accum Acc> |
constexpr unary_op< Acc, Operation::Acc_Add > | op_add (const Acc &acc) |
| Returns an addition operation modifier for the given accumulator.
|
|
template<typename T >
requires (ComplexVector<T> || ComplexElem<T> || is_complex_op_v<T>) |
constexpr unary_op< T, Operation::Conj > | op_conj (const T &e) |
| Returns a conjugate operation modifier for the given complex vector or element.
|
|
template<VectorOrOp Vec1, VectorOrOp Vec2> |
constexpr binary_op< Vec1, Vec2, Operation::Max > | op_max (const Vec1 &a, const Vec2 &b) |
| Returns a maximum operation modifier for the given pair of vectors or elements.
|
|
template<VectorOrOp Vec1, VectorOrOp Vec2> |
constexpr binary_op< Vec1, Vec2, Operation::Min > | op_min (const Vec1 &a, const Vec2 &b) |
| Returns a minimum operation modifier for the given pair of vectors or elements.
|
|
template<typename T >
requires (Vector<T> || Elem<T> || Accum<T>) |
constexpr unary_op< T, Operation::None > | op_none (const T &e) |
| Returns an empty operation modifier for the given vector, vector element or accumulator.
|
|
template<typename T >
requires ((Vector<T> || Elem<T> || Accum<T> || is_op_v<T>) && (!detail::is_complex_v<typename T::value_type>) && (!detail::is_floating_point_v<typename T::value_type>)) |
constexpr binary_op< T, bool, Operation::Sign > | op_sign (const T &e, bool is_signed) |
| Returns dynamically signed/unsigned operation modifier for the vector or element, based on the boolean parameter.
|
|
template<Accum Acc> |
constexpr unary_op< Acc, Operation::Acc_Sub > | op_sub (const Acc &acc) |
| Returns a subtraction operation modifier for the given accumulator.
|
|
template<Accum Acc> |
constexpr binary_op< Acc, bool, Operation::Zero > | op_zero (const Acc &acc, bool to_zero) |
| Zeroes out the given accumulator or not depending on the zero parameter.
|
|
template<typename T1 , typename T2 >
requires (detail::is_vector_elem_ref_v<T1> || detail::is_vector_elem_ref_v<T2>) |
constexpr auto | operator& (T1 v1, T2 v2) |
|
template<typename T1 , typename T2 >
requires (detail::is_vector_elem_ref_v<T1> || detail::is_vector_elem_ref_v<T2>) |
constexpr auto | operator+ (T1 v1, T2 v2) |
|
template<typename T1 , typename T2 >
requires (detail::is_vector_elem_ref_v<T1> || detail::is_vector_elem_ref_v<T2>) |
constexpr auto | operator- (T1 v1, T2 v2) |
|
template<typename T >
requires (detail::is_vector_elem_ref_v<T>) |
constexpr auto | operator<< (T v, int n) -> typename T::value_type |
|
template<typename T >
requires (detail::is_vector_elem_ref_v<T>) |
constexpr auto | operator<< (T v, unsigned n) -> typename T::value_type |
|
template<typename T >
requires (detail::is_vector_elem_ref_v<T>) |
constexpr auto | operator>> (T v, int n) -> typename T::value_type |
|
template<typename T >
requires (detail::is_vector_elem_ref_v<T>) |
constexpr auto | operator>> (T v, unsigned n) -> typename T::value_type |
|
template<typename T1 , typename T2 >
requires (detail::is_vector_elem_ref_v<T1> || detail::is_vector_elem_ref_v<T2>) |
constexpr auto | operator^ (T1 v1, T2 v2) |
|
template<typename T1 , typename T2 >
requires (detail::is_vector_elem_ref_v<T1> || detail::is_vector_elem_ref_v<T2>) |
constexpr auto | operator| (T1 v1, T2 v2) |
|
template<typename T >
requires (detail::is_vector_elem_ref_v<T>) |
constexpr auto | operator~ (T v) |
|
template<VectorOrOp Vec, typename T2 = Utils::get_prev_integer_type_t<typename Vec::value_type>> |
auto | pack (const Vec &v) -> vector< T2, Vec::size()> |
| Returns a conversion of the passed vector to the next smaller integer datatype, with the same number of elements.
|
|
template<unsigned N> |
void | print (const aie::mask< N > &m, bool nl=false, const char *prefix=nullptr) |
| Displays the contents of a mask.
|
|
template<typename C >
requires (Vector<C> || Accum<C>) |
void | print (const C &c, bool nl=false, const char *prefix=nullptr) |
| Displays the contents of a vector or an accumulator.
|
|
template<typename T , unsigned Elems>
requires (!detail::is_floating_point_v<T>) |
void | print_fixed (const aie::vector< T, Elems > &v, int scale, bool nl=false, const char *prefix=nullptr) |
| Displays the contents of a vector integers represented as real numbers in fixed point.
|
|
template<typename Matrix >
requires (Vector<Matrix> || Accum<Matrix>) |
void | print_matrix (const Matrix &m, unsigned cols, const char *prefix=nullptr) |
| Displays the contents of a vector or accumulator, arranged in a matrix layout.
|
|
template<Vector Vec> |
Vec::value_type | reduce_add (const Vec &v) |
| Returns sum of the elements in the input vector.
|
|
template<Vector Vec, Vector... Others> |
auto | reduce_add_v (const Vec &v, const Others &... others) -> aie_dm_resource_remove_t< Vec > |
| Returns the sums of the elements in the input vectors.
|
|
template<RealVector Vec> |
Vec::value_type | reduce_max (const Vec &v) |
| Returns the element from the input vector with the largest value.
|
|
template<RealVector Vec> |
Vec::value_type | reduce_min (const Vec &v) |
| Returns the element from the input vector with the smallest value.
|
|
template<AccumElemBaseType AccumTag, Vector Vec> |
Vec::value_type | reduce_mul (const Vec &v) |
|
template<Vector Vec> |
constexpr Vec::value_type | reduce_mul (const Vec &v) |
|
template<Vector Vec> |
auto | reverse (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but in reverse order.
|
|
template<Elem E1, Elem E2, Mask M>
requires (is_valid_elem_op_v<E1, E2>) |
vector< operand_base_type_t< E1 >, M::size()> | select (const E1 &a, const E2 &b, const M &m) |
| Combines the values of the input vector and value into a vector of the same size by using a mask that specifies which is the source input for each element of the output vector.
|
|
template<Vector Vec, Elem E, Mask M>
requires (is_valid_elem_op_v<E, typename Vec::value_type> && Vec::size() == M::size()) |
auto | select (const Vec &v, E a, const M &m) -> aie_dm_resource_remove_t< Vec > |
| Combines the values of the input vector and value into a vector of the same size by using a mask that specifies which is the source input for each element of the output vector.
|
|
template<Vector Vec1, Vector Vec2, Mask M>
requires (is_same_vector_v<Vec1, Vec2> && Vec1::size() == M::size()) |
auto | select (const Vec1 &v1, const Vec2 &v2, const M &m) -> aie_dm_resource_remove_t< Vec1 > |
| Combines the values of the two input vectors into a vector of the same size by using a mask that specifies which is the source input for each element of the output vector.
|
|
template<Elem E, Vector Vec, Mask M>
requires (is_valid_elem_op_v<E, typename Vec::value_type> && Vec::size() == M::size()) |
auto | select (E a, const Vec &v, const M &m) -> aie_dm_resource_remove_t< Vec > |
| Combines the values of the input value and vector into a vector of the same size by using a mask that specifies which is the source input for each element of the output vector.
|
|
template<Vector Vec> |
auto | shuffle_down (const Vec &v, unsigned n) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but shifted down by n.
|
|
template<Vector Vec> |
auto | shuffle_down_fill (const Vec &v, const Vec &fill, unsigned n) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but shifted down by n.
|
|
template<Vector Vec> |
auto | shuffle_down_replicate (const Vec &v, unsigned n) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but shifted down by n.
|
|
template<Vector Vec> |
auto | shuffle_down_rotate (const Vec &v, unsigned n) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but shifted down by n (elements wrap around):
|
|
template<Vector Vec> |
auto | shuffle_up (const Vec &v, unsigned n) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but shifted up by n.
|
|
template<Vector Vec> |
auto | shuffle_up_fill (const Vec &v, const Vec &fill, unsigned n) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but shifted up by n.
|
|
template<Vector Vec> |
auto | shuffle_up_replicate (const Vec &v, unsigned n) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but shifted up by n.
|
|
template<Vector Vec> |
auto | shuffle_up_rotate (const Vec &v, unsigned n) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector whose contents are the same as the input vector, but shifted up by n (elements wrap around):
|
|
template<RealVector Vec>
requires (arch::is(arch::AIE)) |
auto | sin (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Performs a sine operation on all elements in the input vector.
|
|
template<typename E >
requires (arch::is(arch::AIE) && (RealElem<E> || std::is_integral_v<E>)) |
auto | sin (E a) |
| Performs a sine operation on a single value.
|
|
template<RealVector Vec>
requires (arch::is(arch::AIE)) |
auto | sincos (const Vec &v) -> std::pair< aie_dm_resource_remove_t< Vec >, aie_dm_resource_remove_t< Vec > > |
| Same as sin and cos, but performs both operations and returns a std::pair of vectors of result values.
|
|
template<typename E >
requires (arch::is(arch::AIE) && (RealElem<E> || std::is_integral_v<E>)) |
auto | sincos (E a) |
| Performs both sin and cos, and returns both values as an std::pair (sin first, then cos).
|
|
template<RealVector Vec>
requires (arch::is(arch::AIE)) |
auto | sincos_complex (const Vec &v) -> vector< std::conditional_t< Vec::is_floating_point(), cfloat, cint16 >, Vec::size()> |
| Same as sincos, but returns both values as the real and imaginary parts in a vector of complex values (cos in the real part, sin in the imaginary).
|
|
template<typename E >
requires (arch::is(arch::AIE) && (RealElem<E> || std::is_integral_v<E>)) |
auto | sincos_complex (E a) -> std::conditional_t< detail::is_floating_point_v< operand_base_type_t< E > >, cfloat, cint16 > |
| Same as sincos, but returns both values as the real and imaginary parts of a complex number (cos in the real part, sin in the imaginary part).
|
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac (const Acc &acc, const VecCoeff &coeff, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_antisym (const Acc &acc, const VecCoeff &coeff, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_antisym (const Acc &acc, const VecCoeff &coeff, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_antisym (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_antisym (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned ldata_start, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_antisym (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_antisym_uct (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start, unsigned uct_shift) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_antisym_uct (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start, unsigned uct_shift) |
|
template<unsigned Outputs, unsigned Channels, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE_ML) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Outputs * Channels)) |
auto | sliding_mac_ch (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_sym (const Acc &acc, const VecCoeff &coeff, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_sym (const Acc &acc, const VecCoeff &coeff, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_sym (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_sym (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned ldata_start, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_sym (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_sym_uct (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start, unsigned uct_shift) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStep = 1, Accum Acc, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type> && (Acc::size() == Lanes)) |
auto | sliding_mac_sym_uct (const Acc &acc, const VecCoeff &coeff, unsigned coeff_start, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start, unsigned uct_shift) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul (const VecCoeff &coeff, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_antisym (const VecCoeff &coeff, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, typename VecCoeff , typename VecData >
requires (arch::is(arch::AIE) && VectorOrOp<VecCoeff> && VectorOrOp<VecData> && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_antisym (const VecCoeff &coeff, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_antisym (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_antisym (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned ldata_start, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_antisym (const VecCoeff &coeff, unsigned coeff_start, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_antisym_uct (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start, unsigned uct_shift) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_antisym_uct (const VecCoeff &coeff, unsigned coeff_start, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start, unsigned uct_shift) |
|
template<unsigned Outputs, unsigned Channels, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE_ML) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_ch (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_sym (const VecCoeff &coeff, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStart = 0, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, typename VecCoeff , typename VecData >
requires (arch::is(arch::AIE) && VectorOrOp<VecCoeff> && VectorOrOp<VecData> && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_sym (const VecCoeff &coeff, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_sym (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_sym (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned ldata_start, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStepX = 1, int DataStepY = DataStepX, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_sym (const VecCoeff &coeff, unsigned coeff_start, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_sym_uct (const VecCoeff &coeff, unsigned coeff_start, const VecData &data, unsigned data_start, unsigned uct_shift) |
|
template<unsigned Lanes, unsigned Points, int CoeffStep = 1, int DataStep = 1, AccumElemBaseType AccumTag = accauto, VectorOrOp VecCoeff, VectorOrOp VecData>
requires (arch::is(arch::AIE) && is_valid_mul_op_v<typename VecCoeff::value_type, typename VecData::value_type>) |
auto | sliding_mul_sym_uct (const VecCoeff &coeff, unsigned coeff_start, const VecData &ldata, unsigned ldata_start, const VecData &rdata, unsigned rdata_start, unsigned uct_shift) |
|
template<unsigned Elems>
requires (arch::is(arch::AIE)) |
accum< accfloat, Elems > | sqrt (const accum< accfloat, Elems > &v) |
|
template<Vector Vec> |
auto | sqrt (const Vec &v) -> aie_dm_resource_remove_t< Vec > |
|
template<Elem E> |
auto | sqrt (E a) |
|
template<unsigned Elems, aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T1, ElemBaseType T2>
requires (std::is_same_v<T2, aie_dm_resource_remove_t<T1>>) |
T1 * | store_unaligned_v (T1 *ptr, const vector< T2, Elems > &v, unsigned aligned_elems=1) |
| Store a vector of Elems size whose elements have type T.
|
|
template<aie_dm_resource Resource = aie_dm_resource::none, DecoratedElemBaseType T1, ElemBaseType T2, unsigned Elems>
requires (std::is_same_v<aie_dm_resource_remove_t<T1>, aie_dm_resource_remove_t<T2>>) |
T1 * | store_v (T1 *ptr, const vector< T2, Elems > &v) |
| Store a vector of Elems size whose elements have type T.
|
|
template<AccumOrOp Acc, Vector Vec>
requires (Acc::size() == Vec::size()) |
constexpr auto | sub (const Acc &acc, const Vec &v) -> result_type_t< Acc > |
| Returns an accumulator with the element-wise subtraction of the input accumulator and vector.
|
|
template<AccumOrOp Acc, Elem E> |
auto | sub (const Acc &acc, E a) -> result_type_t< Acc > |
| Returns an accumulator with the subtraction of all the elements of the input accumulator and a value.
|
|
template<AccumOrOp Acc1, AccumOrOp Acc2>
requires (arch::is(arch::AIE_ML) && is_same_accum_v<result_type_t<Acc1>, result_type_t<Acc2>>) |
auto | sub (const Acc1 &acc1, const Acc2 &acc2) -> result_type_t< Acc1 > |
| Returns an accumulator with the element-wise subtraction of the two input accumulators.
|
|
template<Vector Vec, Elem E>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | sub (const Vec &v, E a) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with the subtraction of the elements of the input vector and a value.
|
|
template<Vector Vec1, Vector Vec2>
requires (is_same_vector_v<Vec1, Vec2>) |
auto | sub (const Vec1 &v1, const Vec2 &v2) -> aie_dm_resource_remove_t< Vec1 > |
| Returns a vector with the element-wise subtraction of the two input vectors.
|
|
template<Elem E, Vector Vec>
requires (is_valid_elem_op_v<E, typename Vec::value_type>) |
auto | sub (E a, const Vec &v) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with the subtraction of a value and all the elements of the input vector.
|
|
template<typename T >
requires (detail::is_floating_point_v<T>) |
T | sub (T a, T b) |
|
template<typename T > |
| tlast (const T &, bool) -> tlast< const T &, bool > |
|
template<typename T > |
| tlast (T &, bool &) -> tlast< T &, bool & > |
|
template<typename TR = cint32>
requires (Utils::is_one_of_v<TR, cint16, cint32>) |
auto | to_fixed (cfloat a, int shift=0) |
| Convert a floating point value into a fixed-point value.
|
|
template<typename TR = int32, unsigned Elems>
requires (arch::is(arch::AIE_ML)) |
auto | to_fixed (const vector< bfloat16, Elems > &v, int shift=0) -> vector< TR, Elems > |
| Convert the elements in a bfloat16 vector into fixed-point values.
|
|
template<typename TR = cint32, unsigned Elems>
requires ((arch::is(arch::AIE) || (arch::is(arch::AIE_ML) && __AIE_API_COMPLEX_FP32_EMULATION__ == 1)) && Utils::is_one_of_v<TR, cint16, cint32>) |
auto | to_fixed (const vector< cfloat, Elems > &v, int shift=0) -> vector< TR, Elems > |
| Convert the elements in a floating point vector into fixed-point values.
|
|
template<typename TR = int32, unsigned Elems>
requires (Utils::is_one_of_v<TR, int16, int32>) |
auto | to_fixed (const vector< float, Elems > &v, int shift=0) -> vector< TR, Elems > |
| Convert the elements in a floating point vector into fixed-point values.
|
|
template<typename TR = int32>
requires (Utils::is_one_of_v<TR, int8, int16, int32>) |
auto | to_fixed (float a, int shift=0) |
| Convert a floating point value into a fixed-point value.
|
|
template<typename TR = float, typename T , unsigned Elems>
requires (Utils::is_one_of_v<T, int16, int32>) |
auto | to_float (const vector< T, Elems > &v, int shift=0) -> vector< TR, Elems > |
| Convert the elements in a real fixed-point vector into floating point values.
|
|
template<typename TR = cfloat, typename T , unsigned Elems>
requires (Utils::is_one_of_v<T, cint16, cint32>) |
auto | to_float (const vector< T, Elems > &v, int shift=0) -> vector< TR, Elems > |
| Convert the elements in a complex fixed-point vector into floating point values.
|
|
template<typename TR = float> |
auto | to_float (int a, int shift=0) |
| Convert a fixed-point value into a floating point value.
|
|
template<typename TR = cfloat, typename T >
requires (Utils::is_one_of_v<T, cint16, cint32>) |
auto | to_float (T a, int shift=0) |
| Convert a complex fixed-point value into a floating point value.
|
|
template<typename TR , typename T >
requires (AccumOrOp<T> || MmulOrOp<T>) |
vector< TR, T::size()> | to_vector (const T &acc, int shift=0) |
| Returns the values of the passed accumulator in a vector of the requested type.
|
|
template<Vector Vec> |
auto | transpose (const Vec &v, unsigned Row, unsigned Col) -> aie_dm_resource_remove_t< Vec > |
| The input vector is interpreted as a row-major matrix of the dimensions specified by Row and Col, the function returns a vector ordered as the transpose of the specified matrix.
|
|
template<VectorOrOp Vec, typename T2 = Utils::get_next_integer_type_t<typename Vec::value_type>>
requires (Utils::is_one_of_v<T2, int8, uint8, int16, uint16>) |
auto | unpack (const Vec &v) -> vector< T2, Vec::size()> |
| Returns a conversion of the passed vector to the next larger integer datatype, with the same number of elements.
|
|
template<Vector Vec> |
constexpr auto | upshift (const Vec &v, unsigned shift) -> aie_dm_resource_remove_t< Vec > |
| Returns a vector with all values upshifted by specified number of bits.
|
|
template<detail::NativeVectorType T> |
| vector (T) -> vector< typename detail::native_vector_traits< T >::value_type, detail::native_vector_traits< T >::elems > |
| Template deduction guidelines for aie::vector.
|
|
template<ElemBaseType DstT, Accum Acc>
requires (arch::is(arch::AIE_ML)) |
auto | vector_cast (const Acc &acc) |
| Reinterpret an accumulator as a vector.
|
|
template<ElemBaseType DstT, Vector Vec> |
auto | vector_cast (const Vec &v) |
| Reinterpret a vector using a different element type.
|
|
template<AccumElemBaseType DstTag, Vector Vec>
requires (arch::is(arch::AIE_ML)) |
auto | vector_cast (const Vec &v) |
| Reinterpret a vector as an accumulator.
|
|
template<ElemBaseType T> |
constexpr T | zero () |
| Returns the zero value for the requested data type.
|
|
template<ElemBaseType T, unsigned Elems = native_vector_length_v<T>> |
vector< T, Elems > | zeros () |
| Returns a vector whose elements are initialized to zero.
|
|
template<AccumElemBaseType AccumTag, unsigned Elems = native_vector_length_v<AccumTag>> |
accum< AccumTag, Elems > | zeros () |
| Returns a vector whose elements are initialized to zero.
|
|