argon/argon__half_8hpp_source.html

#pragma once

#include "vector.hpp"


#ifndef ARGON_PLATFORM_MVE

// `ace` is the declaration prefix used on every wrapper function in this header.
// Both variants request forced inlining via [[gnu::always_inline]].
#ifdef __clang__

// Clang: the wrappers are additionally declared constexpr.
#define ace [[gnu::always_inline]] constexpr

#else

// Any other compiler: plain `inline` is used instead of constexpr.
#define ace [[gnu::always_inline]] inline

#endif

/// Primary template of the 64-bit vector wrapper. It is only declared here;
/// the usable definitions are the constrained partial specializations that follow.
template <typename ScalarType>

class ArgonHalf;


/**
 * @brief 64-bit vector wrapper for element types that are themselves 64 bits wide.
 *
 * Selected when ScalarType is `double`, `uint64_t` or `int64_t`. This specialization
 * carries no widening ("Long") operations; it only adds creation, reinterpretation,
 * table, conversion, combine and reverse helpers on top of argon::Vector.
 *
 * @tparam ScalarType Element type of the vector.
 */
template <typename ScalarType>
  requires std::same_as<ScalarType, double> || std::same_as<ScalarType, uint64_t> || std::same_as<ScalarType, int64_t>
class ArgonHalf<ScalarType> : public argon::Vector<neon::Vec64_t<ScalarType>> {
  using T = argon::Vector<neon::Vec64_t<ScalarType>>;

 public:
  /// Underlying 64-bit vector type.
  using vector_type = neon::Vec64_t<ScalarType>;
  /// Lane handle type accepted by lane-based operations.
  using lane_type = const argon::Lane<vector_type>;

  static_assert(neon::is_doubleword_v<vector_type>);

  /// Size of the vector in bytes.
  static constexpr size_t bytes = 8;
  /// Number of ScalarType elements held by the vector.
  static constexpr size_t lanes = bytes / sizeof(ScalarType);

  // Inherit every constructor of the base vector.
  using T::T;

  /// Converts a base-class vector of the same underlying type into an ArgonHalf.
  ace ArgonHalf(argon::Vector<vector_type> vec) : T{std::move(vec)} {}
  ace ArgonHalf(const ArgonHalf&) = default;
  ace ArgonHalf(ArgonHalf&&) = default;
  ace ArgonHalf& operator=(const ArgonHalf&) = default;
  ace ArgonHalf& operator=(ArgonHalf&&) = default;

  /// Create a new ArgonHalf from a raw 64-bit value.
  ace static ArgonHalf<ScalarType> Create(uint64_t a) { return neon::create<vector_type>(a); }

  /// Reinterpret this ArgonHalf as a vector of a different element type.
  template <typename NewScalarType>
  ace ArgonHalf<NewScalarType> As() const {
    return neon::reinterpret<neon::Vec64_t<NewScalarType>>(this->vec_);
  }

  /// Single-table lookup: forwards this vector and `idx` to neon::table_lookup1.
  ace ArgonHalf<ScalarType> TableLookup(ArgonHalf<ScalarType> idx) const {
    return neon::table_lookup1(this->vec_, idx);
  }

  /// Single-table extension: forwards this vector, `b` and `idx` to neon::table_extension1.
  ace ArgonHalf<ScalarType> TableExtension(ArgonHalf<ScalarType> b, ArgonHalf<ScalarType> idx) const {
    return neon::table_extension1(this->vec_, b, idx);
  }

  /**
   * @brief Multi-table extension taking the tables as an array.
   *
   * The array storage is reinterpreted as consecutive `vector_type` values and handed
   * to the pointer overload.
   *
   * @tparam NumTables Number of tables (2, 3 or 4).
   */
  template <size_t NumTables>
  ace ArgonHalf<ScalarType> TableExtension(std::array<ArgonHalf<ScalarType>, NumTables> b,
                                           ArgonHalf<ScalarType> idx) const {
    return TableExtension<NumTables>(reinterpret_cast<vector_type*>(b.data()), idx);
  }

  /**
   * @brief Multi-table extension taking a pointer to NumTables consecutive vectors.
   *
   * @tparam NumTables Number of tables (2, 3 or 4); a single table uses the
   *                   non-template overload instead.
   * @param b   Pointer to the first table; it is read as a
   *            neon::MultiVector_t<vector_type, NumTables>.
   * @param idx Index vector forwarded to neon::table_extensionN.
   */
  template <size_t NumTables>
  ace ArgonHalf<ScalarType> TableExtension(vector_type* b, ArgonHalf<ScalarType> idx) const {
    static_assert(NumTables > 1 && NumTables < 5,
                  "Multi-table Table Extension can only be performed with 2, 3, or 4 tables");

    using multivec_type = neon::MultiVector_t<vector_type, NumTables>;

    // Copy the tables out of the caller's storage into the multi-vector aggregate.
    multivec_type multivector = *reinterpret_cast<multivec_type*>(b);

    if constexpr (NumTables == 2) {
      return neon::table_extension2(this->vec_, multivector, idx);
    } else if constexpr (NumTables == 3) {
      return neon::table_extension3(this->vec_, multivector, idx);
    } else if constexpr (NumTables == 4) {
      return neon::table_extension4(this->vec_, multivector, idx);
    }
  }

  /// Converts the elements to type U via neon::convert.
  template <typename U>
  ace ArgonHalf<U> ConvertTo() const {
    return neon::convert<typename neon::Vec64<U>::type>(this->vec_);
  }

  /**
   * @brief Conversion that forwards `fracbits` to the neon::convert_n family.
   *
   * @tparam U        Target element type: float, uint32_t or int32_t.
   * @tparam fracbits Passed through as the template argument of neon::convert_n*.
   */
  template <typename U, int fracbits>
    requires(std::is_same_v<U, uint32_t> || std::is_same_v<U, int32_t> || std::is_same_v<U, float>)
  ace ArgonHalf<U> ConvertTo() const {
    if constexpr (std::is_same_v<U, float>) {
      return neon::convert_n<fracbits>(this->vec_);
    } else if constexpr (std::is_unsigned_v<U>) {
      return neon::convert_n_unsigned<fracbits>(this->vec_);
    } else if constexpr (std::is_signed_v<U>) {
      return neon::convert_n_signed<fracbits>(this->vec_);
    }
  }

  /// Combines this vector with `high` into a full-width Argon via neon::combine.
  ace Argon<ScalarType> CombineWith(ArgonHalf<ScalarType> high) const { return neon::combine(this->vec_, high); }

  /// Returns the result of the base class's Reverse64bit().
  ace ArgonHalf<ScalarType> Reverse() const { return this->Reverse64bit(); }
};


/**
 * @brief 64-bit vector wrapper for element types that have a next-larger type.
 *
 * Adds the widening ("Long") operations, whose results are full-width
 * Argon<NextLarger_t<ScalarType>> vectors, plus the creation, reinterpretation,
 * table, conversion, combine and reverse helpers.
 *
 * @tparam ScalarType Element type satisfying argon::helpers::has_larger.
 */
template <argon::helpers::has_larger ScalarType>
class ArgonHalf<ScalarType> : public argon::Vector<neon::Vec64_t<ScalarType>> {
  using T = argon::Vector<neon::Vec64_t<ScalarType>>;
  using next_larger = typename argon::helpers::NextLarger_t<ScalarType>;
  using argon_next_larger = Argon<next_larger>;

 public:
  /// Underlying 64-bit vector type.
  using vector_type = neon::Vec64_t<ScalarType>;
  /// Lane handle type accepted by the lane-based overloads.
  using lane_type = const argon::Lane<vector_type>;

  static_assert(neon::is_doubleword_v<vector_type>);

  /// Size of the vector in bytes.
  static constexpr size_t bytes = 8;
  /// Number of ScalarType elements held by the vector.
  static constexpr size_t lanes = bytes / sizeof(ScalarType);

  // Inherit every constructor of the base vector.
  // NOTE(review): unlike the double/uint64_t/int64_t specialization, no converting
  // constructor from argon::Vector<vector_type> is declared here - confirm that is intended.
  using T::T;

  /// Create a new ArgonHalf from a raw 64-bit value.
  ace static ArgonHalf<ScalarType> Create(uint64_t a) { return neon::create<vector_type>(a); }

  /// Reinterpret this ArgonHalf as a vector of a different element type.
  template <typename NewScalarType>
  ace ArgonHalf<NewScalarType> As() const {
    return neon::reinterpret<neon::Vec64_t<NewScalarType>>(this->vec_);
  }

  /// Add, widening.
  ace argon_next_larger AddLong(ArgonHalf<ScalarType> b) const { return neon::add_long(this->vec_, b); }

  /// Multiply by a vector, widening.
  ace argon_next_larger MultiplyLong(ArgonHalf<ScalarType> b) const { return neon::multiply_long(this->vec_, b); }

  /// Multiply by a scalar, widening.
  ace argon_next_larger MultiplyLong(ScalarType b) const { return neon::multiply_long(this->vec_, b); }

  /// Multiply by a single lane of another vector, widening.
  ace argon_next_larger MultiplyLong(lane_type b) const {
    return neon::multiply_long_lane(this->vec_, b.vec(), b.lane());
  }

  // NOTE(review): the MultiplyAddLong overloads forward only this vector and `b`.
  // Multiply-accumulate operations usually also take a wide accumulator operand;
  // confirm these calls match the neon::multiply_add_long* signatures.

  /// Forwards this vector and `b` to neon::multiply_add_long.
  ace argon_next_larger MultiplyAddLong(ArgonHalf<ScalarType> b) const {
    return neon::multiply_add_long(this->vec_, b);
  }

  /// Forwards this vector and the scalar `b` to neon::multiply_add_long.
  ace argon_next_larger MultiplyAddLong(ScalarType b) const { return neon::multiply_add_long(this->vec_, b); }

  /// Forwards this vector and the vector/lane pair of `b` to neon::multiply_add_long_lane.
  ace argon_next_larger MultiplyAddLong(lane_type b) const {
    return neon::multiply_add_long_lane(this->vec_, b.vec(), b.lane());
  }

  /// Forwards to neon::multiply_double_saturate_long; only for int16x4_t / int32x2_t vectors.
  ace argon_next_larger MultiplyDoubleSaturateLong(ArgonHalf<ScalarType> b) const
    requires(std::is_same_v<vector_type, int16x4_t> || std::is_same_v<vector_type, int32x2_t>)
  {
    return neon::multiply_double_saturate_long(this->vec_, b);
  }

  /// Scalar form of MultiplyDoubleSaturateLong; only for int16x4_t / int32x2_t vectors.
  ace argon_next_larger MultiplyDoubleSaturateLong(ScalarType b) const
    requires(std::is_same_v<vector_type, int16x4_t> || std::is_same_v<vector_type, int32x2_t>)
  {
    return neon::multiply_double_saturate_long(this->vec_, b);
  }

  /// Lane form of MultiplyDoubleSaturateLong; only for int16x4_t / int32x2_t vectors.
  ace argon_next_larger MultiplyDoubleSaturateLong(lane_type b) const
    requires(std::is_same_v<vector_type, int16x4_t> || std::is_same_v<vector_type, int32x2_t>)
  {
    return neon::multiply_double_saturate_long_lane(this->vec_, b.vec(), b.lane());
  }

  // NOTE(review): as with MultiplyAddLong, no separate accumulator operand is forwarded
  // by the MultiplyDoubleAddSaturateLong overloads - confirm against the neon wrappers.

  /// Forwards to neon::multiply_double_add_saturate_long; only for int16x4_t / int32x2_t vectors.
  ace argon_next_larger MultiplyDoubleAddSaturateLong(ArgonHalf<ScalarType> b) const
    requires(std::is_same_v<vector_type, int16x4_t> || std::is_same_v<vector_type, int32x2_t>)
  {
    return neon::multiply_double_add_saturate_long(this->vec_, b);
  }

  /// Scalar form of MultiplyDoubleAddSaturateLong; only for int16x4_t / int32x2_t vectors.
  ace argon_next_larger MultiplyDoubleAddSaturateLong(ScalarType b) const
    requires(std::is_same_v<vector_type, int16x4_t> || std::is_same_v<vector_type, int32x2_t>)
  {
    return neon::multiply_double_add_saturate_long(this->vec_, b);
  }

  /// Lane form of MultiplyDoubleAddSaturateLong; only for int16x4_t / int32x2_t vectors.
  ace argon_next_larger MultiplyDoubleAddSaturateLong(lane_type b) const
    requires(std::is_same_v<vector_type, int16x4_t> || std::is_same_v<vector_type, int32x2_t>)
  {
    return neon::multiply_double_add_saturate_long_lane(this->vec_, b.vec(), b.lane());
  }

  /// Subtract, widening.
  ace argon_next_larger SubtractLong(ArgonHalf<ScalarType> b) const { return neon::subtract_long(this->vec_, b); }

  /// Forwards this vector and `b` to neon::subtract_absolute_long.
  ace argon_next_larger SubtractAbsoluteLong(ArgonHalf<ScalarType> b) const {
    return neon::subtract_absolute_long(this->vec_, b);
  }

  /// Forwards this vector to neon::pairwise_add_long.
  /// NOTE(review): a pairwise widening add of a 64-bit vector presumably yields a 64-bit
  /// result, while the declared return type is the full-width Argon - confirm.
  ace argon_next_larger PairwiseAddLong() const { return neon::pairwise_add_long(this->vec_); }

  /// Forwards this vector and `b` to the two-operand neon::pairwise_add_long.
  /// NOTE(review): the parameter names argon::helpers::NextSmaller<ScalarType> directly
  /// (no `_t` / `::type`), so it may not denote a scalar element type - confirm.
  ace argon_next_larger PairwiseAddLong(ArgonHalf<typename argon::helpers::NextSmaller<ScalarType>> b) const {
    return neon::pairwise_add_long(this->vec_, b);
  }

  /// Widens every element to the next larger type via neon::move_long.
  ace argon_next_larger Widen() const { return neon::move_long(this->vec_); }

  /// Forwards to neon::shift_left_long with `n` as its template argument.
  template <size_t n>
  ace argon_next_larger ShiftLeftLong() const {
    return neon::shift_left_long<n>(this->vec_);
  }

  /// Single-table lookup: forwards this vector and `idx` to neon::table_lookup1.
  ace ArgonHalf<ScalarType> TableLookup(ArgonHalf<ScalarType> idx) const {
    return neon::table_lookup1(this->vec_, idx);
  }

  /// Single-table extension: forwards this vector, `b` and `idx` to neon::table_extension1.
  ace ArgonHalf<ScalarType> TableExtension(ArgonHalf<ScalarType> b, ArgonHalf<ScalarType> idx) const {
    return neon::table_extension1(this->vec_, b, idx);
  }

  /**
   * @brief Multi-table extension taking the tables as an array.
   *
   * The array storage is reinterpreted as consecutive `vector_type` values and handed
   * to the pointer overload.
   *
   * @tparam NumTables Number of tables (2, 3 or 4).
   */
  template <size_t NumTables>
  ace ArgonHalf<ScalarType> TableExtension(std::array<ArgonHalf<ScalarType>, NumTables> b,
                                           ArgonHalf<ScalarType> idx) const {
    return TableExtension<NumTables>(reinterpret_cast<vector_type*>(b.data()), idx);
  }

  /**
   * @brief Multi-table extension taking a pointer to NumTables consecutive vectors.
   *
   * @tparam NumTables Number of tables (2, 3 or 4); a single table uses the
   *                   non-template overload instead.
   * @param b   Pointer to the first table; it is read as a
   *            neon::MultiVector_t<vector_type, NumTables>.
   * @param idx Index vector forwarded to neon::table_extensionN.
   */
  template <size_t NumTables>
  ace ArgonHalf<ScalarType> TableExtension(vector_type* b, ArgonHalf<ScalarType> idx) const {
    static_assert(NumTables > 1 && NumTables < 5,
                  "Multi-table Table Extension can only be performed with 2, 3, or 4 tables");

    using multivec_type = neon::MultiVector_t<vector_type, NumTables>;

    // Copy the tables out of the caller's storage into the multi-vector aggregate.
    multivec_type multivector = *reinterpret_cast<multivec_type*>(b);

    if constexpr (NumTables == 2) {
      return neon::table_extension2(this->vec_, multivector, idx);
    } else if constexpr (NumTables == 3) {
      return neon::table_extension3(this->vec_, multivector, idx);
    } else if constexpr (NumTables == 4) {
      return neon::table_extension4(this->vec_, multivector, idx);
    }
  }

  /// Converts the elements to type U via neon::convert.
  template <typename U>
  ace ArgonHalf<U> ConvertTo() const {
    return neon::convert<typename neon::Vec64<U>::type>(this->vec_);
  }

  /**
   * @brief Conversion that forwards `fracbits` to the neon::convert_n family.
   *
   * @tparam U        Target element type: float, uint32_t or int32_t.
   * @tparam fracbits Passed through as the template argument of neon::convert_n*.
   */
  template <typename U, int fracbits>
    requires(std::is_same_v<U, uint32_t> || std::is_same_v<U, int32_t> || std::is_same_v<U, float>)
  ace ArgonHalf<U> ConvertTo() const {
    if constexpr (std::is_same_v<U, float>) {
      return neon::convert_n<fracbits>(this->vec_);
    } else if constexpr (std::is_unsigned_v<U>) {
      return neon::convert_n_unsigned<fracbits>(this->vec_);
    } else if constexpr (std::is_signed_v<U>) {
      return neon::convert_n_signed<fracbits>(this->vec_);
    }
  }

  /// Combines this vector with `high` into a full-width Argon via neon::combine.
  ace Argon<ScalarType> CombineWith(ArgonHalf<ScalarType> high) const { return neon::combine(this->vec_, high); }

  /// Returns the result of the base class's Reverse64bit().
  ace ArgonHalf<ScalarType> Reverse() const { return this->Reverse64bit(); }
};


/// Deduction guide: when an ArgonHalf is constructed from two or more arguments,
/// the element type is taken from the type of the first argument.
template <class... ArgTypes>

  requires(sizeof...(ArgTypes) > 1)

ArgonHalf(ArgTypes...) -> ArgonHalf<std::tuple_element_t<0, std::tuple<ArgTypes...>>>;


/// Scalar-on-the-left addition: evaluated as `b.Add(a)`.
template <typename V>
  requires std::is_scalar_v<V>
ace ArgonHalf<V> operator+(const V a, const ArgonHalf<V> b) {
  ArgonHalf<V> sum = b.Add(a);
  return sum;
}


/// Scalar-on-the-left subtraction: an ArgonHalf is built from `a`, then `b` is subtracted from it.
template <typename V>
  requires std::is_scalar_v<V>
ace ArgonHalf<V> operator-(const V a, const ArgonHalf<V> b) {
  ArgonHalf<V> difference = ArgonHalf<V>{a}.Subtract(b);
  return difference;
}


/// Scalar-on-the-left multiplication: evaluated as `b.Multiply(a)`.
template <typename V>
  requires std::is_scalar_v<V>
ace ArgonHalf<V> operator*(const V a, const ArgonHalf<V> b) {
  ArgonHalf<V> product = b.Multiply(a);
  return product;
}


/// Scalar-on-the-left division: an ArgonHalf is built from `a`, then divided by `b`.
template <typename V>
  requires std::is_scalar_v<V>
ace ArgonHalf<V> operator/(const V a, const ArgonHalf<V> b) {
  ArgonHalf<V> quotient = ArgonHalf<V>{a}.Divide(b);
  return quotient;
}


// Lane deconstruction feature: tuple-protocol specializations for ArgonHalf.
namespace std {

/// Number of tuple elements of an ArgonHalf: its lane count.
/// Derives from integral_constant so that, besides `value`, the `type`,
/// `value_type` and conversion operator expected of a tuple_size specialization exist.
template <typename T>
struct tuple_size<ArgonHalf<T>> : integral_constant<size_t, ArgonHalf<T>::lanes> {};

/// Every tuple element of an ArgonHalf is a Lane of its underlying vector type.
template <size_t Index, typename T>
struct tuple_element<Index, ArgonHalf<T>> {
  static_assert(Index < ArgonHalf<T>::lanes, "tuple_element index is out of range for this ArgonHalf");
  using type = argon::Lane<typename ArgonHalf<T>::vector_type>;
};

}  // namespace std

#endif  // !ARGON_PLATFORM_MVE

// Remove the `ace` helper macro so it does not remain defined after this header.
#undef ace

ArgonHalf< ScalarType >::Create
static ace ArgonHalf< ScalarType > Create(uint64_t a)
Create a new ArgonHalf from a raw 64-bit value.
Definition argon_half.hpp:36

ArgonHalf< ScalarType >::AddLong
ace argon_next_larger AddLong(ArgonHalf< ScalarType > b) const
Add, widening.
Definition argon_half.hpp:122

ArgonHalf< ScalarType >::As
ace ArgonHalf< NewScalarType > As() const
Reinterpret an ArgonHalf as a different element type.
Definition argon_half.hpp:41

ArgonHalf
Definition argon_half.hpp:11

argon::Lane
Represents a single lane of a SIMD vector.
Definition lane.hpp:102

argon::Vector
Represents a SIMD vector with various operations.
Definition vector.hpp:50

argon::Vector< neon::Vec64_t< ScalarType > >::vec
constexpr neon::Vec64_t< ScalarType > vec() const
Definition vector.hpp:268

argon::helpers::NextLarger_t
NextLarger< T >::type NextLarger_t
Helper alias to get the next larger type for a given type.
Definition helpers.hpp:75

std
Lane deconstruction feature.
Definition argon_full.hpp:302