build/html/base__simd_8h_source.html

#pragma once


#include <stdint.h>

#include <algorithm>

#include <cmath>

#include <complex>

#include <functional>


namespace mlx::core::simd {

// Vector of N lanes of T. Only declared here; this header provides the
// single-lane specialization below.
template <typename T, int N>
struct Simd;

// Defined as 1 for every T in this header.
// NOTE(review): presumably the maximum lane count per element type -- confirm
// against the headers that provide wider vectors.
template <typename T>
static constexpr int max_size = 1;

// Single-lane specialization: a thin wrapper around one scalar of type T.
template <typename T>
struct Simd<T, 1> {
  // Number of lanes.
  static constexpr int size = 1;

  // The wrapped scalar.
  T value;

  // Default-initializes `value`; for fundamental T it is left indeterminate.
  Simd() {}

  // Converts from a single-lane vector with a different element type.
  template <typename Other>
  Simd(Simd<Other, 1> other) : value(other.value) {}

  // Wraps a plain scalar. Deliberately not `explicit`, so a scalar can be
  // returned or passed wherever a Simd<T, 1> is expected.
  template <typename Scalar>
  Simd(Scalar scalar) : value(scalar) {}
};


// Reads one Simd<T, N> from the memory starting at `x`.
// The pointer is reinterpreted as a pointer to the vector type and the
// pointee is copied out, so `x` must be readable as a whole Simd<T, N>.
template <typename T, int N>
Simd<T, N> load(const T* x) {
  const auto* vec = reinterpret_cast<const Simd<T, N>*>(x);
  return *vec;
}


template <typename T, int N>


void store(T* dst, Simd<T, N> x) {

  // Maintain invariant that bool is either 0 or 1 as

  // simd comparison ops set all bits in the result to 1

  if constexpr (std::is_same_v<T, bool> && N > 1) {

    x = x & 1;

  }

  *(Simd<T, N>*)dst = x;

}


// Trait: true when an rvalue of T has a callable `.real()` member (as
// std::complex does), false for every other type.

// Fallback, used when the specialization below is not viable.
template <typename T, typename Enable = void>
constexpr bool is_complex = false;

// Chosen through std::void_t whenever `std::declval<T>().real()` is
// well-formed.
template <typename T>
constexpr bool
    is_complex<T, std::void_t<decltype(std::declval<T>().real())>> = true;


// Rounds the lane with std::rint. For complex element types the real and
// imaginary parts are rounded independently and recombined.
template <typename T>
Simd<T, 1> rint(Simd<T, 1> in) {
  if constexpr (!is_complex<T>) {
    return Simd<T, 1>{std::rint(in.value)};
  } else {
    const auto re = std::rint(in.value.real());
    const auto im = std::rint(in.value.imag());
    return Simd<T, 1>{T{re, im}};
  }
}


// Reciprocal square root: T(1.0) divided by sqrt(in). `sqrt` and the
// division operator are the single-lane overloads from this namespace.
template <typename T>
Simd<T, 1> rsqrt(Simd<T, 1> in) {
  const auto root = sqrt(in);
  return T(1.0) / root;
}


// Reciprocal: T(1.0) divided by the lane, using the scalar / Simd operator
// from this namespace.
template <typename T>
Simd<T, 1> recip(Simd<T, 1> in) {
  const T one(1.0);
  return one / in;
}


// DEFAULT_UNARY(name, op) defines
//   template <typename T> Simd<T, 1> name(Simd<T, 1> in)
// which applies `op` to the wrapped scalar; the result is converted back to
// Simd<T, 1> through the implicit scalar constructor.
//
// Each continuation backslash must be followed directly by the next line of
// the definition. A blank line after a backslash ends the macro there, which
// would leave it with an empty body and turn every use below into a no-op.
#define DEFAULT_UNARY(name, op)    \
  template <typename T>            \
  Simd<T, 1> name(Simd<T, 1> in) { \
    return op(in.value);           \
  }

// Operators.
DEFAULT_UNARY(operator-, std::negate{})
DEFAULT_UNARY(operator!, std::logical_not{})

// Element-wise math forwarded to the <cmath> / <complex> overloads.
DEFAULT_UNARY(abs, std::abs)
DEFAULT_UNARY(acos, std::acos)
DEFAULT_UNARY(acosh, std::acosh)
DEFAULT_UNARY(asin, std::asin)
DEFAULT_UNARY(asinh, std::asinh)
DEFAULT_UNARY(atan, std::atan)
DEFAULT_UNARY(atanh, std::atanh)
DEFAULT_UNARY(ceil, std::ceil)
DEFAULT_UNARY(conj, std::conj)
DEFAULT_UNARY(cosh, std::cosh)
DEFAULT_UNARY(expm1, std::expm1)
DEFAULT_UNARY(floor, std::floor)
DEFAULT_UNARY(log, std::log)
DEFAULT_UNARY(log2, std::log2)
DEFAULT_UNARY(log10, std::log10)
DEFAULT_UNARY(log1p, std::log1p)
DEFAULT_UNARY(sinh, std::sinh)
DEFAULT_UNARY(sqrt, std::sqrt)
DEFAULT_UNARY(tan, std::tan)
DEFAULT_UNARY(tanh, std::tanh)


// Bitwise complement of the lane, converted back to the element type T.
template <typename T>
Simd<T, 1> operator~(Simd<T, 1> in) {
  return Simd<T, 1>(~in.value);
}


// Real part of the lane as computed by std::real; the element type of the
// result is whatever std::real returns for T.
template <typename T>
auto real(Simd<T, 1> in) -> Simd<decltype(std::real(in.value)), 1> {
  using Part = decltype(std::real(in.value));
  return Simd<Part, 1>(std::real(in.value));
}


// Imaginary part of the lane as computed by std::imag; the element type of
// the result is whatever std::imag returns for T.
template <typename T>
auto imag(Simd<T, 1> in) -> Simd<decltype(std::imag(in.value)), 1> {
  using Part = decltype(std::imag(in.value));
  return Simd<Part, 1>(std::imag(in.value));
}


// True when std::isnan reports the lane as NaN.
template <typename T>
Simd<bool, 1> isnan(Simd<T, 1> in) {
  const bool lane_is_nan = std::isnan(in.value);
  return lane_is_nan;
}


#define DEFAULT_BINARY(OP)                                                 \

  template <typename T1, typename T2>                                      \

  auto operator OP(Simd<T1, 1> a, Simd<T2, 1> b)                           \

      ->Simd<decltype(a.value OP b.value), 1> {                            \

    return a.value OP b.value;                                             \

  }                                                                        \

  template <typename T1, typename T2>                                      \

  auto operator OP(T1 a, Simd<T2, 1> b)->Simd<decltype(a OP b.value), 1> { \

    return a OP b.value;                                                   \

  }                                                                        \

  template <typename T1, typename T2>                                      \

  auto operator OP(Simd<T1, 1> a, T2 b)->Simd<decltype(a.value OP b), 1> { \

    return a.value OP b;                                                   \

  }


DEFAULT_BINARY(+)

DEFAULT_BINARY(-)

DEFAULT_BINARY(*)

DEFAULT_BINARY(/)

DEFAULT_BINARY(<<)

DEFAULT_BINARY(>>)

DEFAULT_BINARY(|)

DEFAULT_BINARY(^)

DEFAULT_BINARY(&)

DEFAULT_BINARY(&&)

DEFAULT_BINARY(||)


// Remainder of a_ by b_. Integral types use `%`, all other types use
// std::remainder. For signed types, a non-zero result whose sign differs from
// the divisor's has the divisor added to it, so the result takes the
// divisor's sign.
template <typename T>
Simd<T, 1> remainder(Simd<T, 1> a_, Simd<T, 1> b_) {
  const T dividend = a_.value;
  const T divisor = b_.value;

  T rem;
  if constexpr (std::is_integral_v<T>) {
    rem = dividend % divisor;
  } else {
    rem = std::remainder(dividend, divisor);
  }

  if constexpr (std::is_signed_v<T>) {
    const bool rem_negative = rem < 0;
    const bool divisor_negative = divisor < 0;
    if (rem != 0 && rem_negative != divisor_negative) {
      rem += divisor;
    }
  }
  return rem;
}


// Larger of the two lanes. For non-integral types a NaN in the first operand
// is returned as is; a NaN in the second operand is returned as well because
// the `>` comparison against it is false.
template <typename T>
Simd<T, 1> maximum(Simd<T, 1> a_, Simd<T, 1> b_) {
  const T lhs = a_.value;
  const T rhs = b_.value;
  if constexpr (!std::is_integral_v<T>) {
    if (std::isnan(lhs)) {
      return lhs;
    }
  }
  if (lhs > rhs) {
    return lhs;
  }
  return rhs;
}


// Smaller of the two lanes. For non-integral types a NaN in the first operand
// is returned as is; a NaN in the second operand is returned as well because
// the `<` comparison against it is false.
template <typename T>
Simd<T, 1> minimum(Simd<T, 1> a_, Simd<T, 1> b_) {
  const T lhs = a_.value;
  const T rhs = b_.value;
  if constexpr (!std::is_integral_v<T>) {
    if (std::isnan(lhs)) {
      return lhs;
    }
  }
  if (lhs < rhs) {
    return lhs;
  }
  return rhs;
}


// Raises `a` to the power `b`.
//
// Non-integral types forward to std::pow. Integral types use exponentiation
// by squaring.
//
// Negative exponents on signed integral types yield the integer-truncated
// value of 1 / a^|b|: 1 for a == 1, +1 or -1 for a == -1 depending on the
// parity of b, and 0 for every other base (including 0, where the true result
// is undefined). Without this case the squaring loop would never finish:
// right-shifting a negative value is an arithmetic shift and never reaches 0.
template <typename T>
Simd<T, 1> pow(Simd<T, 1> a, Simd<T, 1> b) {
  T base = a.value;
  T exp = b.value;
  if constexpr (!std::is_integral_v<T>) {
    return std::pow(base, exp);
  } else {
    if constexpr (std::is_signed_v<T>) {
      if (exp < 0) {
        if (base == 1) {
          return T(1);
        }
        if (base == -1) {
          // Odd exponents keep the sign, even exponents drop it.
          return (exp & 1) ? T(-1) : T(1);
        }
        return T(0);
      }
    }
    T res = 1;
    while (exp) {
      if (exp & 1) {
        res *= base;
      }
      exp >>= 1;
      // Square only while more exponent bits remain: the last squaring would
      // never be used and could overflow for no reason.
      if (exp) {
        base *= base;
      }
    }
    return res;
  }
}


// std::atan2 of the two lanes, with `a` as the first argument and `b` as the
// second; the result is converted back to T.
template <typename T>
Simd<T, 1> atan2(Simd<T, 1> a, Simd<T, 1> b) {
  return Simd<T, 1>(std::atan2(a.value, b.value));
}


// DEFAULT_COMPARISONS(OP) defines `operator OP` returning Simd<bool, 1> for
// three operand shapes:
//   Simd<T1, 1> OP Simd<T2, 1>,   T1 OP Simd<T2, 1>,   Simd<T1, 1> OP T2.
// Each compares the underlying scalars with the built-in OP.
//
// Each continuation backslash must be followed directly by the next line of
// the definition. A blank line after a backslash ends the macro there, which
// would leave `operator OP` as literal, ill-formed code.
#define DEFAULT_COMPARISONS(OP)                             \
  template <typename T1, typename T2>                       \
  Simd<bool, 1> operator OP(Simd<T1, 1> a, Simd<T2, 1> b) { \
    return a.value OP b.value;                              \
  }                                                         \
  template <typename T1, typename T2>                       \
  Simd<bool, 1> operator OP(T1 a, Simd<T2, 1> b) {          \
    return a OP b.value;                                    \
  }                                                         \
  template <typename T1, typename T2>                       \
  Simd<bool, 1> operator OP(Simd<T1, 1> a, T2 b) {          \
    return a.value OP b;                                    \
  }

// Strict ordering.
DEFAULT_COMPARISONS(>)
DEFAULT_COMPARISONS(<)

// Non-strict ordering.
DEFAULT_COMPARISONS(>=)
DEFAULT_COMPARISONS(<=)

// Equality.
DEFAULT_COMPARISONS(==)
DEFAULT_COMPARISONS(!=)


// Returns `x` when the mask lane converts to true, otherwise `y`.
template <typename MaskT, typename T>
Simd<T, 1> select(Simd<MaskT, 1> mask, Simd<T, 1> x, Simd<T, 1> y) {
  if (mask.value) {
    return x;
  }
  return y;
}


// Limits the lane of `v` to the range [min, max] using std::clamp.
template <typename T>
Simd<T, 1> clamp(Simd<T, 1> v, Simd<T, 1> min, Simd<T, 1> max) {
  const T& lower = min.value;
  const T& upper = max.value;
  return std::clamp(v.value, lower, upper);
}


// Fused multiply-add, x * y + z, through std::fma. `z` may be a scalar or a
// Simd; it is first converted to Simd<T, 1>.
template <typename T, typename U>
Simd<T, 1> fma(Simd<T, 1> x, Simd<T, 1> y, U z) {
  const Simd<T, 1> addend(z);
  return std::fma(x.value, y.value, addend.value);
}


// Reductions


#define DEFAULT_REDUCTION(name, type) \

  template <typename T>               \

  type name(Simd<T, 1> x) {           \

    return x.value;                   \

  }


DEFAULT_REDUCTION(max, T)

DEFAULT_REDUCTION(min, T)

DEFAULT_REDUCTION(sum, T)

DEFAULT_REDUCTION(prod, T)

DEFAULT_REDUCTION(any, bool)

DEFAULT_REDUCTION(all, bool)


} // namespace mlx::core::simd

DEFAULT_REDUCTION
#define DEFAULT_REDUCTION(name, type)
Definition base_simd.h:246

DEFAULT_UNARY
#define DEFAULT_UNARY(name, op)
Definition base_simd.h:69

DEFAULT_BINARY
#define DEFAULT_BINARY(OP)
Definition base_simd.h:116

DEFAULT_COMPARISONS
#define DEFAULT_COMPARISONS(OP)
Definition base_simd.h:209

mlx::core::std
array std(const array &a, bool keepdims, int ddof=0, StreamOrDevice s={})
Computes the standard deviation of the elements of an array.

mlx::core::simd
Definition accelerate_fp16_simd.h:9

mlx::core::simd::isnan
Simd< bool, N > isnan(Simd< T, N > v)
Definition accelerate_simd.h:146

mlx::core::simd::sinh
Simd< float16_t, N > sinh(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:41

mlx::core::simd::N
constexpr int N
Definition neon_fp16_simd.h:9

mlx::core::simd::atanh
Simd< float16_t, N > atanh(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:34

mlx::core::simd::minimum
Simd< T, N > minimum(Simd< T, N > a, Simd< T, N > b)
Definition accelerate_simd.h:215

mlx::core::simd::pow
Simd< float16_t, N > pow(Simd< float16_t, N > x, Simd< float16_t, N > y)
Definition accelerate_fp16_simd.h:54

mlx::core::simd::atan2
Simd< float16_t, N > atan2(Simd< float16_t, N > x, Simd< float16_t, N > y)
Definition accelerate_fp16_simd.h:52

mlx::core::simd::prod
T prod(Simd< T, N > x)
Definition accelerate_simd.h:297

mlx::core::simd::log10
Simd< float16_t, N > log10(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:39

mlx::core::simd::rint
Simd< T, N > rint(Simd< T, N > v)
Definition accelerate_simd.h:127

mlx::core::simd::load
Simd< T, N > load(const T *x)
Definition base_simd.h:28

mlx::core::simd::tan
Simd< float16_t, N > tan(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:42

mlx::core::simd::abs
Simd< T, N > abs(Simd< T, N > v)
Definition accelerate_simd.h:112

mlx::core::simd::acosh
Simd< float16_t, N > acosh(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:30

mlx::core::simd::all
bool all(Simd< T, N > x)
Definition accelerate_simd.h:276

mlx::core::simd::sum
T sum(Simd< T, N > x)
Definition accelerate_simd.h:284

mlx::core::simd::is_complex
constexpr bool is_complex
Definition base_simd.h:43

mlx::core::simd::conj
Simd< T, 1 > conj(Simd< T, 1 > in)
Definition base_simd.h:85

mlx::core::simd::log2
Simd< float16_t, N > log2(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:38

mlx::core::simd::max
T max(Simd< T, N > x)
Definition accelerate_simd.h:288

mlx::core::simd::maximum
Simd< T, N > maximum(Simd< T, N > a, Simd< T, N > b)
Definition accelerate_simd.h:209

mlx::core::simd::exp
Simd< T, N > exp(Simd< T, N > in)
Compute exp(x) in an optimizer friendly way as follows:
Definition math.h:28

mlx::core::simd::log
Simd< float16_t, N > log(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:37

mlx::core::simd::floor
Simd< T, N > floor(Simd< T, N > v)
Definition accelerate_simd.h:113

mlx::core::simd::expm1
Simd< float16_t, N > expm1(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:36

mlx::core::simd::imag
auto imag(Simd< T, 1 > in) -> Simd< decltype(std::imag(in.value)), 1 >
Definition base_simd.h:108

mlx::core::simd::asin
Simd< float16_t, N > asin(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:31

mlx::core::simd::any
bool any(Simd< T, N > x)
Definition accelerate_simd.h:280

mlx::core::simd::fma
Simd< T, N > fma(Simd< T, N > x, Simd< T, N > y, U z)
Definition accelerate_simd.h:269

mlx::core::simd::tanh
Simd< float16_t, N > tanh(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:43

mlx::core::simd::atan
Simd< float16_t, N > atan(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:33

mlx::core::simd::asinh
Simd< float16_t, N > asinh(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:32

mlx::core::simd::remainder
Simd< float16_t, N > remainder(Simd< float16_t, N > x, Simd< float16_t, N > y)
Definition accelerate_fp16_simd.h:53

mlx::core::simd::max_size
static constexpr int max_size
Definition base_simd.h:14

mlx::core::simd::min
T min(Simd< T, N > x)
Definition accelerate_simd.h:292

mlx::core::simd::real
auto real(Simd< T, 1 > in) -> Simd< decltype(std::real(in.value)), 1 >
Definition base_simd.h:104

mlx::core::simd::log1p
Simd< float16_t, N > log1p(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:40

mlx::core::simd::ceil
Simd< T, N > ceil(Simd< T, N > v)
Definition accelerate_simd.h:120

mlx::core::simd::recip
Simd< T, N > recip(Simd< T, N > v)
Definition accelerate_simd.h:131

mlx::core::simd::sqrt
Simd< T, N > sqrt(Simd< T, N > v)
Definition accelerate_simd.h:129

mlx::core::simd::clamp
Simd< T, N > clamp(Simd< T, N > v, Simd< T, N > min, Simd< T, N > max)
Definition accelerate_simd.h:264

mlx::core::simd::acos
Simd< float16_t, N > acos(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:29

mlx::core::simd::rsqrt
Simd< T, N > rsqrt(Simd< T, N > v)
Definition accelerate_simd.h:130

mlx::core::simd::cosh
Simd< float16_t, N > cosh(Simd< float16_t, N > v)
Definition accelerate_fp16_simd.h:35

mlx::core::simd::store
void store(T *dst, Simd< T, N > x)
Definition base_simd.h:33

mlx::core::simd::select
Simd< T1, N > select(Simd< MaskT, N > mask, Simd< T1, N > x, Simd< T2, N > y)
Definition accelerate_simd.h:236

mlx::core::simd::Simd< T, 1 >::size
static constexpr int size
Definition base_simd.h:18

mlx::core::simd::Simd< T, 1 >::Simd
Simd()
Definition base_simd.h:20

mlx::core::simd::Simd< T, 1 >::Simd
Simd(Simd< U, 1 > v)
Definition base_simd.h:22

mlx::core::simd::Simd< T, 1 >::value
T value
Definition base_simd.h:19

mlx::core::simd::Simd< T, 1 >::Simd
Simd(U v)
Definition base_simd.h:24

mlx::core::simd::Simd
Definition accelerate_simd.h:55

mlx::core::simd::Simd::value
asd::Vector< scalar_t, N >::packed_t value
Definition accelerate_simd.h:80