// doxygen/____clang__hip__math_8h_source.html

/*===---- __clang_hip_math.h - Device-side HIP math support ----------------===

 *

 * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 * See https://llvm.org/LICENSE.txt for license information.

 * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 *

 *===-----------------------------------------------------------------------===

 */

#ifndef __CLANG_HIP_MATH_H__

#define __CLANG_HIP_MATH_H__


#if !defined(__HIP__) && !defined(__OPENMP_AMDGCN__)

#error "This file is for HIP and OpenMP AMDGCN device compilation only."

#endif


// The __CLANG_GPU_DISABLE_MATH_WRAPPERS macro provides a way to let standard

// libcalls reach the link step instead of being eagerly replaced.

#ifndef __CLANG_GPU_DISABLE_MATH_WRAPPERS


#if !defined(__HIPCC_RTC__)

#include <limits.h>

#include <stdint.h>

#ifdef __OPENMP_AMDGCN__

#include <omp.h>

#endif

#endif // !defined(__HIPCC_RTC__)


#pragma push_macro("__DEVICE__")


// __DEVICE__ is the qualifier set prepended to every function in this header.
// The OpenMP AMDGCN flavour is a plain static inline function marked nothrow;
// the HIP flavour additionally carries __device__.
#if defined(__OPENMP_AMDGCN__)
#define __DEVICE__ static inline __attribute__((always_inline, nothrow))
#else
#define __DEVICE__ static __device__ inline __attribute__((always_inline))
#endif


// Device library provides fast low-precision and slow full-precision

// implementations for some functions. Which one gets selected depends on

// __CLANG_GPU_APPROX_TRANSCENDENTALS__ which gets defined by clang if

// -ffast-math or -fgpu-approx-transcendentals are in effect.

#pragma push_macro("__FAST_OR_SLOW")
// __FAST_OR_SLOW(fast, slow) expands to `slow` unless
// __CLANG_GPU_APPROX_TRANSCENDENTALS__ is defined, in which case it expands
// to `fast`.
#ifndef __CLANG_GPU_APPROX_TRANSCENDENTALS__
#define __FAST_OR_SLOW(fast, slow) slow
#else
#define __FAST_OR_SLOW(fast, slow) fast
#endif


// A few functions return bool type starting only in C++11.

#pragma push_macro("__RETURN_TYPE")
// Classification helpers (__finite*, __isinf*, __isnan*, __signbit*) return
// bool only for C++ HIP compilation; OpenMP AMDGCN and plain C get int.
#if defined(__cplusplus) && !defined(__OPENMP_AMDGCN__)
#define __RETURN_TYPE bool
#else
#define __RETURN_TYPE int
#endif


#if defined (__cplusplus) && __cplusplus < 201103L
// Pre-C++11 has no static_assert, so emulate one for size comparisons:
// __compare_result is only given a `valid` member in its <true>
// specialisation, so referring to __compare_result<S == T>::valid fails to
// compile whenever S != T.
template<bool>
struct __compare_result{};
template<>
struct __compare_result<true> {
  static const __device__ bool valid;
};

// Swallows its argument so the reference to `valid` is not reported as unused.
__DEVICE__
void __suppress_unused_warning(bool b){}

// Compiles only when the two sizes S and T are equal.
template <unsigned int S, unsigned int T>
__DEVICE__ void __static_assert_equal_size() {
  __suppress_unused_warning(__compare_result<S == T>::valid);
}

// Kept on a single line on purpose: a backslash continuation followed by a
// blank line would leave the macro empty and strand its body at file scope.
#define __static_assert_type_size_equal(A, B) __static_assert_equal_size<A,B>()

#else
// C++11 and later (and C) use the language-level static_assert directly.
#define __static_assert_type_size_equal(A,B) static_assert((A) == (B), "")

#endif


// Parses the NUL-terminated string __tagp as an octal number.
// Returns the accumulated value, or 0 as soon as a character outside
// '0'..'7' is encountered. Overflow wraps in uint64_t arithmetic.
__DEVICE__ uint64_t
__make_mantissa_base8(const char *__tagp __attribute__((nonnull))) {
  uint64_t __acc = 0;
  for (; *__tagp != '\0'; ++__tagp) {
    const char __c = *__tagp;
    if (!(__c >= '0' && __c <= '7'))
      return 0;
    __acc = (__acc * 8u) + __c - '0';
  }
  return __acc;
}


// Parses the NUL-terminated string __tagp as a decimal number.
// Returns the accumulated value, or 0 as soon as a character outside
// '0'..'9' is encountered. Overflow wraps in uint64_t arithmetic.
__DEVICE__ uint64_t
__make_mantissa_base10(const char *__tagp __attribute__((nonnull))) {
  uint64_t __acc = 0;
  for (; *__tagp != '\0'; ++__tagp) {
    const char __c = *__tagp;
    if (!(__c >= '0' && __c <= '9'))
      return 0;
    __acc = (__acc * 10u) + __c - '0';
  }
  return __acc;
}


// Parses the NUL-terminated string __tagp as a hexadecimal number (digits
// only, no "0x" prefix; both letter cases accepted).
// Returns the accumulated value, or 0 as soon as a non-hex character is
// encountered. Overflow wraps in uint64_t arithmetic.
__DEVICE__ uint64_t
__make_mantissa_base16(const char *__tagp __attribute__((nonnull))) {
  uint64_t __acc = 0;
  for (; *__tagp != '\0'; ++__tagp) {
    const char __c = *__tagp;
    if (__c >= '0' && __c <= '9') {
      __acc = (__acc * 16u) + __c - '0';
    } else if (__c >= 'a' && __c <= 'f') {
      __acc = (__acc * 16u) + __c - 'a' + 10;
    } else if (__c >= 'A' && __c <= 'F') {
      __acc = (__acc * 16u) + __c - 'A' + 10;
    } else {
      return 0;
    }
  }
  return __acc;
}


// Converts a nan()/nanf() tag string into an integer payload.
//
// The radix is chosen from the prefix, C-literal style:
//   "0x..." / "0X..."  -> hexadecimal
//   "0..."             -> octal
//   anything else      -> decimal
// The per-radix helpers return 0 when the string contains a character that
// is not a digit of that radix.
__DEVICE__
uint64_t __make_mantissa(const char *__tagp __attribute__((nonnull))) {
  if (*__tagp == '0') {
    ++__tagp;

    // Step over the 'x'/'X' itself: the base-16 parser only accepts hex
    // digits, so handing it the prefix character would always yield 0.
    if (*__tagp == 'x' || *__tagp == 'X')
      return __make_mantissa_base16(__tagp + 1);
    else
      return __make_mantissa_base8(__tagp);
  }

  return __make_mantissa_base10(__tagp);
}


// BEGIN FLOAT


// BEGIN INTRINSICS


// Fast cosine: forwards to the OCML native cosine.
__DEVICE__ float __cosf(float __x) {
  return __ocml_native_cos_f32(__x);
}

// Fast 10^x, evaluated as exp2(log2(10) * x) on the amdgcn exp2 builtin.
__DEVICE__ float __exp10f(float __x) {
  const float __scale = 0x1.a934f0p+1f; // log2(10)
  return __builtin_amdgcn_exp2f(__scale * __x);
}

// Fast e^x, evaluated as exp2(log2(e) * x) on the amdgcn exp2 builtin.
__DEVICE__ float __expf(float __x) {
  const float __scale = 0x1.715476p+0f; // log2(e)
  return __builtin_amdgcn_exp2f(__scale * __x);
}


// Single-precision addition with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __fadd_rn exists and is a
// plain `+`.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ float __fadd_rd(float __x, float __y) {
  return __ocml_add_rtn_f32(__x, __y);
}
__DEVICE__ float __fadd_rn(float __x, float __y) {
  return __ocml_add_rte_f32(__x, __y);
}
__DEVICE__ float __fadd_ru(float __x, float __y) {
  return __ocml_add_rtp_f32(__x, __y);
}
__DEVICE__ float __fadd_rz(float __x, float __y) {
  return __ocml_add_rtz_f32(__x, __y);
}
#else
__DEVICE__ float __fadd_rn(float __x, float __y) {
  return __x + __y;
}
#endif


// Single-precision division with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __fdiv_rn exists and is a
// plain `/`.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ float __fdiv_rd(float __x, float __y) {
  return __ocml_div_rtn_f32(__x, __y);
}
__DEVICE__ float __fdiv_rn(float __x, float __y) {
  return __ocml_div_rte_f32(__x, __y);
}
__DEVICE__ float __fdiv_ru(float __x, float __y) {
  return __ocml_div_rtp_f32(__x, __y);
}
__DEVICE__ float __fdiv_rz(float __x, float __y) {
  return __ocml_div_rtz_f32(__x, __y);
}
#else
__DEVICE__ float __fdiv_rn(float __x, float __y) {
  return __x / __y;
}
#endif


// Division intrinsic; implemented here as an ordinary float division.
__DEVICE__ float __fdividef(float __x, float __y) {
  return __x / __y;
}


// Single-precision fused multiply-add (__x * __y + __z) with an explicit
// rounding suffix. With OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz
// variants forward to the OCML rtn/rte/rtp/rtz entry points; otherwise only
// __fmaf_rn exists and uses __builtin_fmaf.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ float __fmaf_rd(float __x, float __y, float __z) {
  return __ocml_fma_rtn_f32(__x, __y, __z);
}
__DEVICE__ float __fmaf_rn(float __x, float __y, float __z) {
  return __ocml_fma_rte_f32(__x, __y, __z);
}
__DEVICE__ float __fmaf_ru(float __x, float __y, float __z) {
  return __ocml_fma_rtp_f32(__x, __y, __z);
}
__DEVICE__ float __fmaf_rz(float __x, float __y, float __z) {
  return __ocml_fma_rtz_f32(__x, __y, __z);
}
#else
__DEVICE__ float __fmaf_rn(float __x, float __y, float __z) {
  return __builtin_fmaf(__x, __y, __z);
}
#endif


// Single-precision multiplication with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __fmul_rn exists and is a
// plain `*`.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ float __fmul_rd(float __x, float __y) {
  return __ocml_mul_rtn_f32(__x, __y);
}
__DEVICE__ float __fmul_rn(float __x, float __y) {
  return __ocml_mul_rte_f32(__x, __y);
}
__DEVICE__ float __fmul_ru(float __x, float __y) {
  return __ocml_mul_rtp_f32(__x, __y);
}
__DEVICE__ float __fmul_rz(float __x, float __y) {
  return __ocml_mul_rtz_f32(__x, __y);
}
#else
__DEVICE__ float __fmul_rn(float __x, float __y) {
  return __x * __y;
}
#endif


// Single-precision reciprocal (1.0f / __x) with an explicit rounding suffix.
// With OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the
// OCML rounded-division entry points; otherwise only __frcp_rn exists and is
// a plain division.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ float __frcp_rd(float __x) {
  return __ocml_div_rtn_f32(1.0f, __x);
}
__DEVICE__ float __frcp_rn(float __x) {
  return __ocml_div_rte_f32(1.0f, __x);
}
__DEVICE__ float __frcp_ru(float __x) {
  return __ocml_div_rtp_f32(1.0f, __x);
}
__DEVICE__ float __frcp_rz(float __x) {
  return __ocml_div_rtz_f32(1.0f, __x);
}
#else
__DEVICE__ float __frcp_rn(float __x) {
  return 1.0f / __x;
}
#endif


// Reciprocal square root via the amdgcn rsq builtin.
__DEVICE__ float __frsqrt_rn(float __x) {
  return __builtin_amdgcn_rsqf(__x);
}


// Single-precision square root with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __fsqrt_rn exists.
// NOTE(review): the fallback calls the OCML *native* sqrt, whereas the double
// counterpart (__dsqrt_rn) uses __builtin_sqrt - confirm the precision of the
// native variant is acceptable for an "_rn" function.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ float __fsqrt_rd(float __x) {
  return __ocml_sqrt_rtn_f32(__x);
}
__DEVICE__ float __fsqrt_rn(float __x) {
  return __ocml_sqrt_rte_f32(__x);
}
__DEVICE__ float __fsqrt_ru(float __x) {
  return __ocml_sqrt_rtp_f32(__x);
}
__DEVICE__ float __fsqrt_rz(float __x) {
  return __ocml_sqrt_rtz_f32(__x);
}
#else
__DEVICE__ float __fsqrt_rn(float __x) {
  return __ocml_native_sqrt_f32(__x);
}
#endif


// Single-precision subtraction with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __fsub_rn exists and is a
// plain `-`.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ float __fsub_rd(float __x, float __y) {
  return __ocml_sub_rtn_f32(__x, __y);
}
__DEVICE__ float __fsub_rn(float __x, float __y) {
  return __ocml_sub_rte_f32(__x, __y);
}
__DEVICE__ float __fsub_ru(float __x, float __y) {
  return __ocml_sub_rtp_f32(__x, __y);
}
__DEVICE__ float __fsub_rz(float __x, float __y) {
  return __ocml_sub_rtz_f32(__x, __y);
}
#else
__DEVICE__ float __fsub_rn(float __x, float __y) {
  return __x - __y;
}
#endif


// Logarithm / power intrinsics.

// Base-10 logarithm via __builtin_log10f.
__DEVICE__ float __log10f(float __x) {
  return __builtin_log10f(__x);
}

// Base-2 logarithm via the amdgcn log builtin.
__DEVICE__ float __log2f(float __x) {
  return __builtin_amdgcn_logf(__x);
}

// Natural logarithm via __builtin_logf.
__DEVICE__ float __logf(float __x) {
  return __builtin_logf(__x);
}

// __x raised to __y; forwards to the OCML pow.
__DEVICE__ float __powf(float __x, float __y) {
  return __ocml_pow_f32(__x, __y);
}


// Clamps __x to [0, 1]: values below 0 give 0, values above 1 give 1, and
// everything else (including inputs for which both comparisons are false)
// is returned unchanged.
__DEVICE__ float __saturatef(float __x) {
  if (__x < 0)
    return 0;
  if (__x > 1)
    return 1;
  return __x;
}


// Fast sine and cosine of __x in one call: stores the OCML native sine in
// *__sinptr and the OCML native cosine in *__cosptr (sine is written first).
__DEVICE__ void __sincosf(float __x, float *__sinptr, float *__cosptr) {
  const float __s = __ocml_native_sin_f32(__x);
  *__sinptr = __s;
  const float __c = __ocml_native_cos_f32(__x);
  *__cosptr = __c;
}


// Fast sine: forwards to the OCML native sine.
__DEVICE__ float __sinf(float __x) {
  return __ocml_native_sin_f32(__x);
}

// Fast tangent: __sinf(x) multiplied by the amdgcn reciprocal of __cosf(x).
__DEVICE__ float __tanf(float __x) {
  const float __s = __sinf(__x);
  const float __inv_c = __builtin_amdgcn_rcpf(__cosf(__x));
  return __s * __inv_c;
}

// END INTRINSICS


// Integer absolute-value functions, provided for C++ only; each forwards to
// the matching compiler builtin.
#ifdef __cplusplus
__DEVICE__ int abs(int __x) { return __builtin_abs(__x); }
__DEVICE__ long labs(long __x) { return __builtin_labs(__x); }
__DEVICE__ long long llabs(long long __x) { return __builtin_llabs(__x); }
#endif


// Inverse trigonometric / hyperbolic functions and cube root (float); each
// forwards to the OCML routine named in its body.

__DEVICE__ float acosf(float __x) {
  return __ocml_acos_f32(__x);
}

__DEVICE__ float acoshf(float __x) {
  return __ocml_acosh_f32(__x);
}

__DEVICE__ float asinf(float __x) {
  return __ocml_asin_f32(__x);
}

__DEVICE__ float asinhf(float __x) {
  return __ocml_asinh_f32(__x);
}

// Arguments are forwarded to OCML in the order given.
__DEVICE__ float atan2f(float __x, float __y) {
  return __ocml_atan2_f32(__x, __y);
}

__DEVICE__ float atanf(float __x) {
  return __ocml_atan_f32(__x);
}

__DEVICE__ float atanhf(float __x) {
  return __ocml_atanh_f32(__x);
}

__DEVICE__ float cbrtf(float __x) {
  return __ocml_cbrt_f32(__x);
}


// ceilf and copysignf map to compiler builtins; the rest forward to OCML.

__DEVICE__ float ceilf(float __x) {
  return __builtin_ceilf(__x);
}

__DEVICE__ float copysignf(float __x, float __y) {
  return __builtin_copysignf(__x, __y);
}

// Uses the fast intrinsic __cosf when approximate transcendentals are
// enabled, the full OCML cosine otherwise (see __FAST_OR_SLOW).
__DEVICE__ float cosf(float __x) {
  return __FAST_OR_SLOW(__cosf, __ocml_cos_f32)(__x);
}

__DEVICE__ float coshf(float __x) {
  return __ocml_cosh_f32(__x);
}

__DEVICE__ float cospif(float __x) {
  return __ocml_cospi_f32(__x);
}

__DEVICE__ float cyl_bessel_i0f(float __x) {
  return __ocml_i0_f32(__x);
}

__DEVICE__ float cyl_bessel_i1f(float __x) {
  return __ocml_i1_f32(__x);
}


// Error-function family (float); each forwards to the matching OCML routine.

__DEVICE__ float erfcf(float __x) {
  return __ocml_erfc_f32(__x);
}

__DEVICE__ float erfcinvf(float __x) {
  return __ocml_erfcinv_f32(__x);
}

__DEVICE__ float erfcxf(float __x) {
  return __ocml_erfcx_f32(__x);
}

__DEVICE__ float erff(float __x) {
  return __ocml_erf_f32(__x);
}

__DEVICE__ float erfinvf(float __x) {
  return __ocml_erfinv_f32(__x);
}


// Exponentials and basic float helpers. exp2f/expf/fabsf/floorf use compiler
// builtins, fdividef is a plain division, the rest forward to OCML.

__DEVICE__ float exp10f(float __x) {
  return __ocml_exp10_f32(__x);
}

__DEVICE__ float exp2f(float __x) {
  return __builtin_exp2f(__x);
}

__DEVICE__ float expf(float __x) {
  return __builtin_expf(__x);
}

__DEVICE__ float expm1f(float __x) {
  return __ocml_expm1_f32(__x);
}

__DEVICE__ float fabsf(float __x) {
  return __builtin_fabsf(__x);
}

__DEVICE__ float fdimf(float __x, float __y) {
  return __ocml_fdim_f32(__x, __y);
}

__DEVICE__ float fdividef(float __x, float __y) {
  return __x / __y;
}

__DEVICE__ float floorf(float __x) {
  return __builtin_floorf(__x);
}


// fmaf/fmaxf/fminf/frexpf use compiler builtins; fmodf, hypotf and ilogbf
// forward to OCML.

__DEVICE__ float fmaf(float __x, float __y, float __z) {
  return __builtin_fmaf(__x, __y, __z);
}

__DEVICE__ float fmaxf(float __x, float __y) {
  return __builtin_fmaxf(__x, __y);
}

__DEVICE__ float fminf(float __x, float __y) {
  return __builtin_fminf(__x, __y);
}

__DEVICE__ float fmodf(float __x, float __y) {
  return __ocml_fmod_f32(__x, __y);
}

// The exponent is written through __nptr by the builtin.
__DEVICE__ float frexpf(float __x, int *__nptr) {
  return __builtin_frexpf(__x, __nptr);
}

__DEVICE__ float hypotf(float __x, float __y) {
  return __ocml_hypot_f32(__x, __y);
}

__DEVICE__ int ilogbf(float __x) {
  return __ocml_ilogb_f32(__x);
}


// Float classification helpers (return type is __RETURN_TYPE: bool or int
// depending on the compilation mode) followed by the order-0/1 Bessel
// functions of the first kind.

__DEVICE__ __RETURN_TYPE __finitef(float __x) {
  return __builtin_isfinite(__x);
}

__DEVICE__ __RETURN_TYPE __isinff(float __x) {
  return __builtin_isinf(__x);
}

__DEVICE__ __RETURN_TYPE __isnanf(float __x) {
  return __builtin_isnan(__x);
}

__DEVICE__ float j0f(float __x) {
  return __ocml_j0_f32(__x);
}

__DEVICE__ float j1f(float __x) {
  return __ocml_j1_f32(__x);
}


// Bessel function of the first kind of integer order __n (float).
//
// Orders 0 and 1 go straight to j0f/j1f. Other orders are built with the
// forward recurrence  J(k+1) = (2k / x) * J(k) - J(k-1), seeded with j0f and
// j1f and run for k = 1 .. __n-1.
// NOTE(review): for __n < 0 the loop body never runs and j1f(__x) is
// returned - confirm whether negative orders are expected here.
//
// TODO: we could use Ahmes multiplication and the Miller & Brown algorithm
//       for linear recurrences to get O(log n) steps, but it's unclear if
//       it'd be beneficial in this case.
__DEVICE__ float jnf(int __n, float __x) {
  switch (__n) {
  case 0:
    return j0f(__x);
  case 1:
    return j1f(__x);
  default:
    break;
  }

  float __prev = j0f(__x);
  float __curr = j1f(__x);
  int __k = 1;
  while (__k < __n) {
    const float __next = (2 * __k) / __x * __curr - __prev;
    __prev = __curr;
    __curr = __next;
    ++__k;
  }

  return __curr;
}


// ldexpf uses the amdgcn ldexp builtin; llrintf/llroundf round with the
// float builtin and convert the result to long long on return.

__DEVICE__ float ldexpf(float __x, int __e) {
  return __builtin_amdgcn_ldexpf(__x, __e);
}

__DEVICE__ float lgammaf(float __x) {
  return __ocml_lgamma_f32(__x);
}

__DEVICE__ long long int llrintf(float __x) {
  return __builtin_rintf(__x);
}

__DEVICE__ long long int llroundf(float __x) {
  return __builtin_roundf(__x);
}

__DEVICE__ float log10f(float __x) {
  return __builtin_log10f(__x);
}

__DEVICE__ float log1pf(float __x) {
  return __ocml_log1p_f32(__x);
}


// log2f and logf pick the fast intrinsic or the OCML routine through
// __FAST_OR_SLOW; lrintf/lroundf round with the float builtin and convert
// the result to long on return.

__DEVICE__ float log2f(float __x) {
  return __FAST_OR_SLOW(__log2f, __ocml_log2_f32)(__x);
}

__DEVICE__ float logbf(float __x) {
  return __ocml_logb_f32(__x);
}

__DEVICE__ float logf(float __x) {
  return __FAST_OR_SLOW(__logf, __ocml_log_f32)(__x);
}

__DEVICE__ long int lrintf(float __x) {
  return __builtin_rintf(__x);
}

__DEVICE__ long int lroundf(float __x) {
  return __builtin_roundf(__x);
}


// Forwards to the OCML modf. OCML writes its second result through an
// address_space(5) pointer, so a local temporary receives it and is then
// copied out to *__iptr; the OCML return value is returned unchanged.
__DEVICE__ float modff(float __x, float *__iptr) {
  float __out;
#ifdef __OPENMP_AMDGCN__
#pragma omp allocate(__out) allocator(omp_thread_mem_alloc)
#endif
  const float __result =
      __ocml_modf_f32(__x, (__attribute__((address_space(5))) float *)&__out);
  *__iptr = __out;
  return __result;
}


// Builds a float NaN whose payload comes from the tag string __tagp.
//
// The value is assembled through a bit-field view of the float: sign cleared,
// all exponent bits set, quiet bit set, and the low 22 bits taken from
// __make_mantissa(__tagp) (higher payload bits are dropped by the bit-field
// width).
__DEVICE__ float nanf(const char *__tagp __attribute__((nonnull))) {
  union {
    float val;
    struct ieee_float {
      unsigned int mantissa : 22;
      unsigned int quiet : 1;
      unsigned int exponent : 8;
      unsigned int sign : 1;
    } bits;
  } __pun;
  // The bit-field struct must overlay the float exactly.
  __static_assert_type_size_equal(sizeof(__pun.val), sizeof(__pun.bits));

  __pun.bits.sign = 0u;
  __pun.bits.exponent = ~0u;
  __pun.bits.quiet = 1u;
  __pun.bits.mantissa = __make_mantissa(__tagp);

  return __pun.val;
}


// nearbyintf uses the compiler builtin; the remaining functions forward to
// OCML (norm3df/norm4df -> len3/len4, normcdff/normcdfinvf -> ncdf/ncdfinv).

__DEVICE__ float nearbyintf(float __x) {
  return __builtin_nearbyintf(__x);
}

__DEVICE__ float nextafterf(float __x, float __y) {
  return __ocml_nextafter_f32(__x, __y);
}

__DEVICE__ float norm3df(float __x, float __y, float __z) {
  return __ocml_len3_f32(__x, __y, __z);
}

__DEVICE__ float norm4df(float __x, float __y, float __z, float __w) {
  return __ocml_len4_f32(__x, __y, __z, __w);
}

__DEVICE__ float normcdff(float __x) {
  return __ocml_ncdf_f32(__x);
}

__DEVICE__ float normcdfinvf(float __x) {
  return __ocml_ncdfinv_f32(__x);
}


// Euclidean norm of the first __dim elements of __a: the square root of the
// sum of squares, accumulated in float in index order.
//
// A non-positive __dim sums nothing and yields sqrt(0). (The previous
// `while (__dim--)` form kept reading past the array for a negative __dim.)
//
// TODO: placeholder until OCML adds support.
__DEVICE__
float normf(int __dim, const float *__a) {
  float __r = 0;
  for (int __i = 0; __i < __dim; ++__i)
    __r += __a[__i] * __a[__i];

  return __builtin_sqrtf(__r);
}


// Power / root / remainder wrappers (float); each forwards to OCML.

__DEVICE__ float powf(float __x, float __y) {
  return __ocml_pow_f32(__x, __y);
}

// Integer-exponent power; forwards to the OCML pown.
__DEVICE__ float powif(float __x, int __y) {
  return __ocml_pown_f32(__x, __y);
}

__DEVICE__ float rcbrtf(float __x) {
  return __ocml_rcbrt_f32(__x);
}

__DEVICE__ float remainderf(float __x, float __y) {
  return __ocml_remainder_f32(__x, __y);
}


// Forwards to the OCML remquo. OCML writes the quotient through an
// address_space(5) pointer, so a local temporary receives it and is then
// copied out to *__quo; the OCML return value is returned unchanged.
__DEVICE__ float remquof(float __x, float __y, int *__quo) {
  int __q;
#ifdef __OPENMP_AMDGCN__
#pragma omp allocate(__q) allocator(omp_thread_mem_alloc)
#endif
  const float __rem = __ocml_remquo_f32(
      __x, __y, (__attribute__((address_space(5))) int *)&__q);
  *__quo = __q;
  return __rem;
}


// rintf uses the compiler builtin; the others forward to OCML
// (rnorm3df/rnorm4df -> rlen3/rlen4).

__DEVICE__ float rhypotf(float __x, float __y) {
  return __ocml_rhypot_f32(__x, __y);
}

__DEVICE__ float rintf(float __x) {
  return __builtin_rintf(__x);
}

__DEVICE__ float rnorm3df(float __x, float __y, float __z) {
  return __ocml_rlen3_f32(__x, __y, __z);
}

__DEVICE__ float rnorm4df(float __x, float __y, float __z, float __w) {
  return __ocml_rlen4_f32(__x, __y, __z, __w);
}


// Reciprocal Euclidean norm of the first __dim elements of __a: the OCML
// rsqrt of the sum of squares, accumulated in float in index order.
//
// A non-positive __dim sums nothing and yields rsqrt(0). (The previous
// `while (__dim--)` form kept reading past the array for a negative __dim.)
//
// TODO: placeholder until OCML adds support.
__DEVICE__
float rnormf(int __dim, const float *__a) {
  float __r = 0;
  for (int __i = 0; __i < __dim; ++__i)
    __r += __a[__i] * __a[__i];

  return __ocml_rsqrt_f32(__r);
}


// roundf uses the compiler builtin; rsqrtf forwards to OCML.

__DEVICE__ float roundf(float __x) {
  return __builtin_roundf(__x);
}

__DEVICE__ float rsqrtf(float __x) {
  return __ocml_rsqrt_f32(__x);
}


// Scales __x by 2 raised to the power __n, where __n is a long.
//
// Exponents at or above INT_MAX keep going through the OCML scalb. All other
// exponents use the amdgcn ldexp builtin, which takes an int: values below
// INT_MIN are clamped to INT_MIN first, so they are not silently truncated
// to an unrelated int when narrowed.
__DEVICE__
float scalblnf(float __x, long int __n) {
  if (__n >= INT_MAX)
    return __ocml_scalb_f32(__x, __n);

  if (__n < INT_MIN)
    __n = INT_MIN;

  return __builtin_amdgcn_ldexpf(__x, (int)__n);
}


// scalbnf uses the amdgcn ldexp builtin; __signbitf uses the signbit builtin
// and returns __RETURN_TYPE (bool or int depending on compilation mode).

__DEVICE__ float scalbnf(float __x, int __n) {
  return __builtin_amdgcn_ldexpf(__x, __n);
}

__DEVICE__ __RETURN_TYPE __signbitf(float __x) {
  return __builtin_signbitf(__x);
}


// Computes sine and cosine of __x together, storing them in *__sinptr and
// *__cosptr.
//
// When approximate transcendentals are enabled the fast __sincosf intrinsic
// is used. The check accepts __CLANG_GPU_APPROX_TRANSCENDENTALS__ (the macro
// __FAST_OR_SLOW keys on in this header) as well as the older
// __CLANG_CUDA_APPROX_TRANSCENDENTALS__ spelling, so sincosf follows the same
// switch as sinf/cosf.
//
// Otherwise the OCML sincos is called; it returns the sine and writes the
// cosine through an address_space(5) pointer, hence the local temporary.
__DEVICE__
void sincosf(float __x, float *__sinptr, float *__cosptr) {
#if defined(__CLANG_GPU_APPROX_TRANSCENDENTALS__) ||                           \
    defined(__CLANG_CUDA_APPROX_TRANSCENDENTALS__)
  __sincosf(__x, __sinptr, __cosptr);
#else
  float __tmp;
#ifdef __OPENMP_AMDGCN__
#pragma omp allocate(__tmp) allocator(omp_thread_mem_alloc)
#endif
  *__sinptr =
      __ocml_sincos_f32(__x, (__attribute__((address_space(5))) float *)&__tmp);
  *__cosptr = __tmp;
#endif
}


// Forwards to the OCML sincospi. OCML returns the sine result and writes the
// cosine result through an address_space(5) pointer, so a local temporary
// receives it before it is copied to *__cosptr.
__DEVICE__ void sincospif(float __x, float *__sinptr, float *__cosptr) {
  float __c;
#ifdef __OPENMP_AMDGCN__
#pragma omp allocate(__c) allocator(omp_thread_mem_alloc)
#endif
  *__sinptr = __ocml_sincospi_f32(
      __x, (__attribute__((address_space(5))) float *)&__c);
  *__cosptr = __c;
}


// sinf picks the fast intrinsic or the OCML routine through __FAST_OR_SLOW;
// sqrtf uses the compiler builtin; the others forward to OCML.

__DEVICE__ float sinf(float __x) {
  return __FAST_OR_SLOW(__sinf, __ocml_sin_f32)(__x);
}

__DEVICE__ float sinhf(float __x) {
  return __ocml_sinh_f32(__x);
}

__DEVICE__ float sinpif(float __x) {
  return __ocml_sinpi_f32(__x);
}

__DEVICE__ float sqrtf(float __x) {
  return __builtin_sqrtf(__x);
}

__DEVICE__ float tanf(float __x) {
  return __ocml_tan_f32(__x);
}


// truncf uses the compiler builtin; the others forward to OCML.

__DEVICE__ float tanhf(float __x) {
  return __ocml_tanh_f32(__x);
}

__DEVICE__ float tgammaf(float __x) {
  return __ocml_tgamma_f32(__x);
}

__DEVICE__ float truncf(float __x) {
  return __builtin_truncf(__x);
}

__DEVICE__ float y0f(float __x) {
  return __ocml_y0_f32(__x);
}

__DEVICE__ float y1f(float __x) {
  return __ocml_y1_f32(__x);
}


// Bessel function of the second kind of integer order __n (float).
//
// Orders 0 and 1 go straight to y0f/y1f. Other orders are built with the
// forward recurrence  Y(k+1) = (2k / x) * Y(k) - Y(k-1), seeded with y0f and
// y1f and run for k = 1 .. __n-1.
// NOTE(review): for __n < 0 the loop body never runs and y1f(__x) is
// returned - confirm whether negative orders are expected here.
//
// TODO: we could use Ahmes multiplication and the Miller & Brown algorithm
//       for linear recurrences to get O(log n) steps, but it's unclear if
//       it'd be beneficial in this case. Placeholder until OCML adds
//       support.
__DEVICE__ float ynf(int __n, float __x) {
  switch (__n) {
  case 0:
    return y0f(__x);
  case 1:
    return y1f(__x);
  default:
    break;
  }

  float __prev = y0f(__x);
  float __curr = y1f(__x);
  int __k = 1;
  while (__k < __n) {
    const float __next = (2 * __k) / __x * __curr - __prev;
    __prev = __curr;
    __curr = __next;
    ++__k;
  }

  return __curr;
}


// END FLOAT


// BEGIN DOUBLE

// Inverse trigonometric / hyperbolic functions and cube root (double); each
// forwards to the OCML routine named in its body.

__DEVICE__ double acos(double __x) {
  return __ocml_acos_f64(__x);
}

__DEVICE__ double acosh(double __x) {
  return __ocml_acosh_f64(__x);
}

__DEVICE__ double asin(double __x) {
  return __ocml_asin_f64(__x);
}

__DEVICE__ double asinh(double __x) {
  return __ocml_asinh_f64(__x);
}

__DEVICE__ double atan(double __x) {
  return __ocml_atan_f64(__x);
}

// Arguments are forwarded to OCML in the order given.
__DEVICE__ double atan2(double __x, double __y) {
  return __ocml_atan2_f64(__x, __y);
}

__DEVICE__ double atanh(double __x) {
  return __ocml_atanh_f64(__x);
}

__DEVICE__ double cbrt(double __x) {
  return __ocml_cbrt_f64(__x);
}


// ceil and copysign map to compiler builtins; the rest forward to OCML.

__DEVICE__ double ceil(double __x) {
  return __builtin_ceil(__x);
}

__DEVICE__ double copysign(double __x, double __y) {
  return __builtin_copysign(__x, __y);
}

__DEVICE__ double cos(double __x) {
  return __ocml_cos_f64(__x);
}

__DEVICE__ double cosh(double __x) {
  return __ocml_cosh_f64(__x);
}

__DEVICE__ double cospi(double __x) {
  return __ocml_cospi_f64(__x);
}

__DEVICE__ double cyl_bessel_i0(double __x) {
  return __ocml_i0_f64(__x);
}

__DEVICE__ double cyl_bessel_i1(double __x) {
  return __ocml_i1_f64(__x);
}


// Error-function family (double); each forwards to the matching OCML routine.

__DEVICE__ double erf(double __x) {
  return __ocml_erf_f64(__x);
}

__DEVICE__ double erfc(double __x) {
  return __ocml_erfc_f64(__x);
}

__DEVICE__ double erfcinv(double __x) {
  return __ocml_erfcinv_f64(__x);
}

__DEVICE__ double erfcx(double __x) {
  return __ocml_erfcx_f64(__x);
}

__DEVICE__ double erfinv(double __x) {
  return __ocml_erfinv_f64(__x);
}


// Exponentials and basic double helpers. fabs and floor use compiler
// builtins; the rest forward to OCML.

__DEVICE__ double exp(double __x) {
  return __ocml_exp_f64(__x);
}

__DEVICE__ double exp10(double __x) {
  return __ocml_exp10_f64(__x);
}

__DEVICE__ double exp2(double __x) {
  return __ocml_exp2_f64(__x);
}

__DEVICE__ double expm1(double __x) {
  return __ocml_expm1_f64(__x);
}

__DEVICE__ double fabs(double __x) {
  return __builtin_fabs(__x);
}

__DEVICE__ double fdim(double __x, double __y) {
  return __ocml_fdim_f64(__x, __y);
}

__DEVICE__ double floor(double __x) {
  return __builtin_floor(__x);
}


// fma/fmax/fmin/frexp use compiler builtins; fmod, hypot and ilogb forward
// to OCML.

__DEVICE__ double fma(double __x, double __y, double __z) {
  return __builtin_fma(__x, __y, __z);
}

__DEVICE__ double fmax(double __x, double __y) {
  return __builtin_fmax(__x, __y);
}

__DEVICE__ double fmin(double __x, double __y) {
  return __builtin_fmin(__x, __y);
}

__DEVICE__ double fmod(double __x, double __y) {
  return __ocml_fmod_f64(__x, __y);
}

// The exponent is written through __nptr by the builtin.
__DEVICE__ double frexp(double __x, int *__nptr) {
  return __builtin_frexp(__x, __nptr);
}

__DEVICE__ double hypot(double __x, double __y) {
  return __ocml_hypot_f64(__x, __y);
}

__DEVICE__ int ilogb(double __x) {
  return __ocml_ilogb_f64(__x);
}


// Double classification helpers (return type is __RETURN_TYPE: bool or int
// depending on the compilation mode) followed by the order-0/1 Bessel
// functions of the first kind.

__DEVICE__ __RETURN_TYPE __finite(double __x) {
  return __builtin_isfinite(__x);
}

__DEVICE__ __RETURN_TYPE __isinf(double __x) {
  return __builtin_isinf(__x);
}

__DEVICE__ __RETURN_TYPE __isnan(double __x) {
  return __builtin_isnan(__x);
}

__DEVICE__ double j0(double __x) {
  return __ocml_j0_f64(__x);
}

__DEVICE__ double j1(double __x) {
  return __ocml_j1_f64(__x);
}


// Bessel function of the first kind of integer order __n (double).
//
// Orders 0 and 1 go straight to j0/j1. Other orders are built with the
// forward recurrence  J(k+1) = (2k / x) * J(k) - J(k-1), seeded with j0 and
// j1 and run for k = 1 .. __n-1.
// NOTE(review): for __n < 0 the loop body never runs and j1(__x) is
// returned - confirm whether negative orders are expected here.
//
// TODO: we could use Ahmes multiplication and the Miller & Brown algorithm
//       for linear recurrences to get O(log n) steps, but it's unclear if
//       it'd be beneficial in this case. Placeholder until OCML adds
//       support.
__DEVICE__ double jn(int __n, double __x) {
  switch (__n) {
  case 0:
    return j0(__x);
  case 1:
    return j1(__x);
  default:
    break;
  }

  double __prev = j0(__x);
  double __curr = j1(__x);
  int __k = 1;
  while (__k < __n) {
    const double __next = (2 * __k) / __x * __curr - __prev;
    __prev = __curr;
    __curr = __next;
    ++__k;
  }
  return __curr;
}


// ldexp uses the amdgcn ldexp builtin; llrint/llround round with the double
// builtin and convert the result to long long on return; the others forward
// to OCML.

__DEVICE__ double ldexp(double __x, int __e) {
  return __builtin_amdgcn_ldexp(__x, __e);
}

__DEVICE__ double lgamma(double __x) {
  return __ocml_lgamma_f64(__x);
}

__DEVICE__ long long int llrint(double __x) {
  return __builtin_rint(__x);
}

__DEVICE__ long long int llround(double __x) {
  return __builtin_round(__x);
}

__DEVICE__ double log(double __x) {
  return __ocml_log_f64(__x);
}

__DEVICE__ double log10(double __x) {
  return __ocml_log10_f64(__x);
}


// log1p/log2/logb forward to OCML; lrint/lround round with the double
// builtin and convert the result to long on return.

__DEVICE__ double log1p(double __x) {
  return __ocml_log1p_f64(__x);
}

__DEVICE__ double log2(double __x) {
  return __ocml_log2_f64(__x);
}

__DEVICE__ double logb(double __x) {
  return __ocml_logb_f64(__x);
}

__DEVICE__ long int lrint(double __x) {
  return __builtin_rint(__x);
}

__DEVICE__ long int lround(double __x) {
  return __builtin_round(__x);
}


// Forwards to the OCML modf. OCML writes its second result through an
// address_space(5) pointer, so a local temporary receives it and is then
// copied out to *__iptr; the OCML return value is returned unchanged.
__DEVICE__ double modf(double __x, double *__iptr) {
  double __out;
#ifdef __OPENMP_AMDGCN__
#pragma omp allocate(__out) allocator(omp_thread_mem_alloc)
#endif
  const double __result =
      __ocml_modf_f64(__x, (__attribute__((address_space(5))) double *)&__out);
  *__iptr = __out;
  return __result;
}


// Builds a double NaN whose payload comes from the tag string __tagp.
//
// The result has the sign bit clear, all 11 exponent bits set, the quiet bit
// (bit 51) set, and the low 51 bits taken from __make_mantissa(__tagp).
//
// Two implementations produce that bit pattern:
//  * non-Windows: a bit-field view of the double;
//  * _WIN32: explicit 64-bit integer arithmetic (the bit-field layout is not
//    relied upon there).
__DEVICE__
double nan(const char *__tagp) {
#if !_WIN32
  union {
    double val;
    struct ieee_double {
      uint64_t mantissa : 51;
      uint32_t quiet : 1;
      uint32_t exponent : 11;
      uint32_t sign : 1;
    } bits;
  } __tmp;
  // The bit-field struct must overlay the double exactly.
  __static_assert_type_size_equal(sizeof(__tmp.val), sizeof(__tmp.bits));

  __tmp.bits.sign = 0u;
  __tmp.bits.exponent = ~0u;
  __tmp.bits.quiet = 1u;
  __tmp.bits.mantissa = __make_mantissa(__tagp);

  return __tmp.val;
#else
  __static_assert_type_size_equal(sizeof(uint64_t), sizeof(double));
  // Keep only the 51 payload bits, matching the bit-field width used in the
  // other branch, so an oversized tag cannot spill into the sign bit.
  uint64_t __val = __make_mantissa(__tagp) & (((uint64_t)1 << 51) - 1);
  // Quiet bit (51) plus the 11 exponent bits (52..62). The constant must be
  // 64-bit before shifting: shifting a 32-bit int by 51 is undefined.
  __val |= (uint64_t)0xFFF << 51;
  // Copy the bits instead of dereferencing a cast pointer (no aliasing
  // violation, and valid in C as well as C++).
  double __result;
  __builtin_memcpy(&__result, &__val, sizeof(__result));
  return __result;
#endif
}


// nearbyint uses the compiler builtin; nextafter forwards to OCML.

__DEVICE__ double nearbyint(double __x) {
  return __builtin_nearbyint(__x);
}

__DEVICE__ double nextafter(double __x, double __y) {
  return __ocml_nextafter_f64(__x, __y);
}


// Euclidean norm of the first __dim elements of __a: the square root of the
// sum of squares, accumulated in double in index order.
//
// A non-positive __dim sums nothing and yields sqrt(0). (The previous
// `while (__dim--)` form kept reading past the array for a negative __dim.)
//
// TODO: placeholder until OCML adds support.
__DEVICE__
double norm(int __dim, const double *__a) {
  double __r = 0;
  for (int __i = 0; __i < __dim; ++__i)
    __r += __a[__i] * __a[__i];

  return __builtin_sqrt(__r);
}


// Fixed-size norms, normal-distribution helpers and power/remainder wrappers
// (double); each forwards to OCML (norm3d/norm4d -> len3/len4,
// normcdf/normcdfinv -> ncdf/ncdfinv, powi -> pown).

__DEVICE__ double norm3d(double __x, double __y, double __z) {
  return __ocml_len3_f64(__x, __y, __z);
}

__DEVICE__ double norm4d(double __x, double __y, double __z, double __w) {
  return __ocml_len4_f64(__x, __y, __z, __w);
}

__DEVICE__ double normcdf(double __x) {
  return __ocml_ncdf_f64(__x);
}

__DEVICE__ double normcdfinv(double __x) {
  return __ocml_ncdfinv_f64(__x);
}

__DEVICE__ double pow(double __x, double __y) {
  return __ocml_pow_f64(__x, __y);
}

__DEVICE__ double powi(double __x, int __y) {
  return __ocml_pown_f64(__x, __y);
}

__DEVICE__ double rcbrt(double __x) {
  return __ocml_rcbrt_f64(__x);
}

__DEVICE__ double remainder(double __x, double __y) {
  return __ocml_remainder_f64(__x, __y);
}


// Forwards to the OCML remquo. OCML writes the quotient through an
// address_space(5) pointer, so a local temporary receives it and is then
// copied out to *__quo; the OCML return value is returned unchanged.
__DEVICE__ double remquo(double __x, double __y, int *__quo) {
  int __q;
#ifdef __OPENMP_AMDGCN__
#pragma omp allocate(__q) allocator(omp_thread_mem_alloc)
#endif
  const double __rem = __ocml_remquo_f64(
      __x, __y, (__attribute__((address_space(5))) int *)&__q);
  *__quo = __q;
  return __rem;
}


// rhypot forwards to OCML; rint uses the compiler builtin.

__DEVICE__ double rhypot(double __x, double __y) {
  return __ocml_rhypot_f64(__x, __y);
}

__DEVICE__ double rint(double __x) {
  return __builtin_rint(__x);
}


// Reciprocal Euclidean norm of the first __dim elements of __a: the OCML
// rsqrt of the sum of squares, accumulated in double in index order.
//
// A non-positive __dim sums nothing and yields rsqrt(0). (The previous
// `while (__dim--)` form kept reading past the array for a negative __dim.)
//
// TODO: placeholder until OCML adds support.
__DEVICE__
double rnorm(int __dim, const double *__a) {
  double __r = 0;
  for (int __i = 0; __i < __dim; ++__i)
    __r += __a[__i] * __a[__i];

  return __ocml_rsqrt_f64(__r);
}


// round uses the compiler builtin; the others forward to OCML
// (rnorm3d/rnorm4d -> rlen3/rlen4).

__DEVICE__ double rnorm3d(double __x, double __y, double __z) {
  return __ocml_rlen3_f64(__x, __y, __z);
}

__DEVICE__ double rnorm4d(double __x, double __y, double __z, double __w) {
  return __ocml_rlen4_f64(__x, __y, __z, __w);
}

__DEVICE__ double round(double __x) {
  return __builtin_round(__x);
}

__DEVICE__ double rsqrt(double __x) {
  return __ocml_rsqrt_f64(__x);
}


// Scales __x by 2 raised to the power __n, where __n is a long.
//
// Exponents at or above INT_MAX keep going through the OCML scalb. All other
// exponents use the amdgcn ldexp builtin, which takes an int: values below
// INT_MIN are clamped to INT_MIN first, so they are not silently truncated
// to an unrelated int when narrowed.
__DEVICE__
double scalbln(double __x, long int __n) {
  if (__n >= INT_MAX)
    return __ocml_scalb_f64(__x, __n);

  if (__n < INT_MIN)
    __n = INT_MIN;

  return __builtin_amdgcn_ldexp(__x, (int)__n);
}

// scalbn uses the amdgcn ldexp builtin; __signbit uses the signbit builtin
// and returns __RETURN_TYPE; sin forwards to OCML.

__DEVICE__ double scalbn(double __x, int __n) {
  return __builtin_amdgcn_ldexp(__x, __n);
}

__DEVICE__ __RETURN_TYPE __signbit(double __x) {
  return __builtin_signbit(__x);
}

__DEVICE__ double sin(double __x) {
  return __ocml_sin_f64(__x);
}


// Forwards to the OCML sincos. OCML returns the sine result and writes the
// cosine result through an address_space(5) pointer, so a local temporary
// receives it before it is copied to *__cosptr.
__DEVICE__ void sincos(double __x, double *__sinptr, double *__cosptr) {
  double __c;
#ifdef __OPENMP_AMDGCN__
#pragma omp allocate(__c) allocator(omp_thread_mem_alloc)
#endif
  *__sinptr = __ocml_sincos_f64(
      __x, (__attribute__((address_space(5))) double *)&__c);
  *__cosptr = __c;
}


// Forwards to the OCML sincospi. OCML returns the sine result and writes the
// cosine result through an address_space(5) pointer, so a local temporary
// receives it before it is copied to *__cosptr.
__DEVICE__ void sincospi(double __x, double *__sinptr, double *__cosptr) {
  double __c;
#ifdef __OPENMP_AMDGCN__
#pragma omp allocate(__c) allocator(omp_thread_mem_alloc)
#endif
  *__sinptr = __ocml_sincospi_f64(
      __x, (__attribute__((address_space(5))) double *)&__c);
  *__cosptr = __c;
}


// sqrt and trunc use compiler builtins; the others forward to OCML.

__DEVICE__ double sinh(double __x) {
  return __ocml_sinh_f64(__x);
}

__DEVICE__ double sinpi(double __x) {
  return __ocml_sinpi_f64(__x);
}

__DEVICE__ double sqrt(double __x) {
  return __builtin_sqrt(__x);
}

__DEVICE__ double tan(double __x) {
  return __ocml_tan_f64(__x);
}

__DEVICE__ double tanh(double __x) {
  return __ocml_tanh_f64(__x);
}

__DEVICE__ double tgamma(double __x) {
  return __ocml_tgamma_f64(__x);
}

__DEVICE__ double trunc(double __x) {
  return __builtin_trunc(__x);
}

__DEVICE__ double y0(double __x) {
  return __ocml_y0_f64(__x);
}

__DEVICE__ double y1(double __x) {
  return __ocml_y1_f64(__x);
}


// Bessel function of the second kind of integer order __n (double).
//
// Orders 0 and 1 go straight to y0/y1. Other orders are built with the
// forward recurrence  Y(k+1) = (2k / x) * Y(k) - Y(k-1), seeded with y0 and
// y1 and run for k = 1 .. __n-1.
// NOTE(review): for __n < 0 the loop body never runs and y1(__x) is
// returned - confirm whether negative orders are expected here.
//
// TODO: we could use Ahmes multiplication and the Miller & Brown algorithm
//       for linear recurrences to get O(log n) steps, but it's unclear if
//       it'd be beneficial in this case. Placeholder until OCML adds
//       support.
__DEVICE__ double yn(int __n, double __x) {
  switch (__n) {
  case 0:
    return y0(__x);
  case 1:
    return y1(__x);
  default:
    break;
  }

  double __prev = y0(__x);
  double __curr = y1(__x);
  int __k = 1;
  while (__k < __n) {
    const double __next = (2 * __k) / __x * __curr - __prev;
    __prev = __curr;
    __curr = __next;
    ++__k;
  }

  return __curr;
}


// BEGIN INTRINSICS

// Double-precision addition with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __dadd_rn exists and is a
// plain `+`.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ double __dadd_rd(double __x, double __y) {
  return __ocml_add_rtn_f64(__x, __y);
}
__DEVICE__ double __dadd_rn(double __x, double __y) {
  return __ocml_add_rte_f64(__x, __y);
}
__DEVICE__ double __dadd_ru(double __x, double __y) {
  return __ocml_add_rtp_f64(__x, __y);
}
__DEVICE__ double __dadd_rz(double __x, double __y) {
  return __ocml_add_rtz_f64(__x, __y);
}
#else
__DEVICE__ double __dadd_rn(double __x, double __y) {
  return __x + __y;
}
#endif


// Double-precision division with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __ddiv_rn exists and is a
// plain `/`.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ double __ddiv_rd(double __x, double __y) {
  return __ocml_div_rtn_f64(__x, __y);
}
__DEVICE__ double __ddiv_rn(double __x, double __y) {
  return __ocml_div_rte_f64(__x, __y);
}
__DEVICE__ double __ddiv_ru(double __x, double __y) {
  return __ocml_div_rtp_f64(__x, __y);
}
__DEVICE__ double __ddiv_rz(double __x, double __y) {
  return __ocml_div_rtz_f64(__x, __y);
}
#else
__DEVICE__ double __ddiv_rn(double __x, double __y) {
  return __x / __y;
}
#endif


// Double-precision multiplication with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __dmul_rn exists and is a
// plain `*`.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ double __dmul_rd(double __x, double __y) {
  return __ocml_mul_rtn_f64(__x, __y);
}
__DEVICE__ double __dmul_rn(double __x, double __y) {
  return __ocml_mul_rte_f64(__x, __y);
}
__DEVICE__ double __dmul_ru(double __x, double __y) {
  return __ocml_mul_rtp_f64(__x, __y);
}
__DEVICE__ double __dmul_rz(double __x, double __y) {
  return __ocml_mul_rtz_f64(__x, __y);
}
#else
__DEVICE__ double __dmul_rn(double __x, double __y) {
  return __x * __y;
}
#endif


// Double-precision reciprocal (1.0 / __x) with an explicit rounding suffix.
// With OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the
// OCML rounded-division entry points; otherwise only __drcp_rn exists and is
// a plain division.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ double __drcp_rd(double __x) {
  return __ocml_div_rtn_f64(1.0, __x);
}
__DEVICE__ double __drcp_rn(double __x) {
  return __ocml_div_rte_f64(1.0, __x);
}
__DEVICE__ double __drcp_ru(double __x) {
  return __ocml_div_rtp_f64(1.0, __x);
}
__DEVICE__ double __drcp_rz(double __x) {
  return __ocml_div_rtz_f64(1.0, __x);
}
#else
__DEVICE__ double __drcp_rn(double __x) {
  return 1.0 / __x;
}
#endif


// Double-precision square root with an explicit rounding suffix. With
// OCML_BASIC_ROUNDED_OPERATIONS the rd/rn/ru/rz variants forward to the OCML
// rtn/rte/rtp/rtz entry points; otherwise only __dsqrt_rn exists and uses
// __builtin_sqrt.
#ifdef OCML_BASIC_ROUNDED_OPERATIONS
__DEVICE__ double __dsqrt_rd(double __x) {
  return __ocml_sqrt_rtn_f64(__x);
}
__DEVICE__ double __dsqrt_rn(double __x) {
  return __ocml_sqrt_rte_f64(__x);
}
__DEVICE__ double __dsqrt_ru(double __x) {
  return __ocml_sqrt_rtp_f64(__x);
}
__DEVICE__ double __dsqrt_rz(double __x) {
  return __ocml_sqrt_rtz_f64(__x);
}
#else
__DEVICE__ double __dsqrt_rn(double __x) {
  return __builtin_sqrt(__x);
}
#endif


#if defined OCML_BASIC_ROUNDED_OPERATIONS

__DEVICE__

double __dsub_rd(double __x, double __y) {

  return __ocml_sub_rtn_f64(__x, __y);

}

__DEVICE__

double __dsub_rn(double __x, double __y) {

  return __ocml_sub_rte_f64(__x, __y);

}

__DEVICE__

double __dsub_ru(double __x, double __y) {

  return __ocml_sub_rtp_f64(__x, __y);

}

// `_rz` flavour of double-precision subtraction (__x minus __y). Forwards both
// operands to __ocml_sub_rtz_f64 and returns its result (rtz presumably means
// round-toward-zero; confirm against the OCML documentation).
__DEVICE__ double __dsub_rz(double __x, double __y) {
  const double __diff = __ocml_sub_rtz_f64(__x, __y);
  return __diff;
}

#else

// Fallback used when OCML_BASIC_ROUNDED_OPERATIONS is not defined: the
// difference is computed with the built-in `-` operator.
__DEVICE__ double __dsub_rn(double __x, double __y) {
  const double __diff = __x - __y;
  return __diff;
}

#endif


#if defined OCML_BASIC_ROUNDED_OPERATIONS

// `_rd` flavour of the double-precision fma. Passes __x, __y and __z, in that
// order, to __ocml_fma_rtn_f64 and returns its result (rtn presumably means
// round-toward-negative-infinity; confirm against the OCML documentation).
__DEVICE__ double __fma_rd(double __x, double __y, double __z) {
  const double __fused = __ocml_fma_rtn_f64(__x, __y, __z);
  return __fused;
}

// `_rn` flavour of the double-precision fma, available when
// OCML_BASIC_ROUNDED_OPERATIONS is defined. Passes __x, __y and __z, in that
// order, to __ocml_fma_rte_f64 (rte presumably means round-to-nearest-even;
// confirm against the OCML documentation).
__DEVICE__ double __fma_rn(double __x, double __y, double __z) {
  const double __fused = __ocml_fma_rte_f64(__x, __y, __z);
  return __fused;
}

// `_ru` flavour of the double-precision fma. Passes __x, __y and __z, in that
// order, to __ocml_fma_rtp_f64 and returns its result (rtp presumably means
// round-toward-positive-infinity; confirm against the OCML documentation).
__DEVICE__ double __fma_ru(double __x, double __y, double __z) {
  const double __fused = __ocml_fma_rtp_f64(__x, __y, __z);
  return __fused;
}

// `_rz` flavour of the double-precision fma. Passes __x, __y and __z, in that
// order, to __ocml_fma_rtz_f64 and returns its result (rtz presumably means
// round-toward-zero; confirm against the OCML documentation).
__DEVICE__ double __fma_rz(double __x, double __y, double __z) {
  const double __fused = __ocml_fma_rtz_f64(__x, __y, __z);
  return __fused;
}

#else

// Fallback used when OCML_BASIC_ROUNDED_OPERATIONS is not defined: the result
// comes from the compiler builtin __builtin_fma applied to (__x, __y, __z).
__DEVICE__ double __fma_rn(double __x, double __y, double __z) {
  const double __fused = __builtin_fma(__x, __y, __z);
  return __fused;
}

#endif

// END INTRINSICS

// END DOUBLE


// C only macros

#if !defined(__cplusplus) && __STDC_VERSION__ >= 201112L
// Type-generic classification macros, provided only when compiling as C11 or
// later. Each macro uses _Generic to pick the float or the double helper from
// the static type of __x and then calls that helper with __x. Only `float` and
// `double` have associations and there is no `default`, so an argument of any
// other type is rejected at compile time.
#define isfinite(__x) _Generic((__x), float : __finitef, double : __finite)(__x)
#define isinf(__x) _Generic((__x), float : __isinff, double : __isinf)(__x)
#define isnan(__x) _Generic((__x), float : __isnanf, double : __isnan)(__x)
// The replacement text must start on the line directly after the backslash:
// with a blank line in between, the macro ends up with an empty body and the
// _Generic expression is left dangling at file scope.
#define signbit(__x)                                                           \
  _Generic((__x), float : __signbitf, double : __signbit)(__x)
#endif // !defined(__cplusplus) && __STDC_VERSION__ >= 201112L


#if defined(__cplusplus)

// Generic two-argument minimum. Evaluates `__arg1 < __arg2` once and yields
// __arg1 when it holds, otherwise __arg2. Both arguments are taken by value
// and the selected one is returned by value.
template <typename _Tp>
__DEVICE__ _Tp min(_Tp __arg1, _Tp __arg2) {
  return (__arg1 < __arg2) ? __arg1 : __arg2;
}


// Generic two-argument maximum. Evaluates `__arg1 > __arg2` once and yields
// __arg1 when it holds, otherwise __arg2. Both arguments are taken by value
// and the selected one is returned by value.
template <typename _Tp>
__DEVICE__ _Tp max(_Tp __arg1, _Tp __arg2) {
  return (__arg1 > __arg2) ? __arg1 : __arg2;
}


// Non-template int overload of min: returns __arg1 when it is strictly less
// than __arg2, and __arg2 in every other case (including equality).
__DEVICE__ int min(int __arg1, int __arg2) {
  if (__arg1 < __arg2)
    return __arg1;
  return __arg2;
}

// Non-template int overload of max: returns __arg1 when it is strictly greater
// than __arg2, and __arg2 in every other case (including equality).
__DEVICE__ int max(int __arg1, int __arg2) {
  if (__arg1 > __arg2)
    return __arg1;
  return __arg2;
}


// float overload of max: defers entirely to the compiler builtin
// __builtin_fmaxf rather than using a comparison operator.
__DEVICE__ float max(float __x, float __y) {
  const float __larger = __builtin_fmaxf(__x, __y);
  return __larger;
}


// double overload of max: defers entirely to the compiler builtin
// __builtin_fmax rather than using a comparison operator.
__DEVICE__ double max(double __x, double __y) {
  const double __larger = __builtin_fmax(__x, __y);
  return __larger;
}


// float overload of min: defers entirely to the compiler builtin
// __builtin_fminf rather than using a comparison operator.
__DEVICE__ float min(float __x, float __y) {
  const float __smaller = __builtin_fminf(__x, __y);
  return __smaller;
}


// double overload of min: defers entirely to the compiler builtin
// __builtin_fmin rather than using a comparison operator.
__DEVICE__ double min(double __x, double __y) {
  const double __smaller = __builtin_fmin(__x, __y);
  return __smaller;
}


#if !defined(__HIPCC_RTC__) && !defined(__OPENMP_AMDGCN__)

// Host-side int overload of min, compiled only when neither __HIPCC_RTC__ nor
// __OPENMP_AMDGCN__ is defined. Returns __arg1 when it is strictly less than
// __arg2, and __arg2 otherwise.
__host__ inline static int min(int __arg1, int __arg2) {
  if (__arg1 < __arg2)
    return __arg1;
  return __arg2;
}


// Host-side int overload of max, compiled only when neither __HIPCC_RTC__ nor
// __OPENMP_AMDGCN__ is defined. Returns __arg1 when it is strictly greater
// than __arg2, and __arg2 otherwise.
__host__ inline static int max(int __arg1, int __arg2) {
  if (__arg1 > __arg2)
    return __arg1;
  return __arg2;
}

#endif // !defined(__HIPCC_RTC__) && !defined(__OPENMP_AMDGCN__)

#endif


#pragma pop_macro("__DEVICE__")

#pragma pop_macro("__RETURN_TYPE")

#pragma pop_macro("__FAST_OR_SLOW")


#endif // __CLANG_GPU_DISABLE_MATH_WRAPPERS

#endif // __CLANG_HIP_MATH_H__

abs
__DEVICE__ long long abs(long long __n)
Definition: __clang_cuda_cmath.h:41

__fsqrt_rd
__DEVICE__ float __fsqrt_rd(float __a)
Definition: __clang_cuda_device_functions.h:320

__fdiv_rd
__DEVICE__ float __fdiv_rd(float __a, float __b)
Definition: __clang_cuda_device_functions.h:209

__dsub_ru
__DEVICE__ double __dsub_ru(double __a, double __b)
Definition: __clang_cuda_device_functions.h:168

__drcp_ru
__DEVICE__ double __drcp_ru(double __a)
Definition: __clang_cuda_device_functions.h:156

__frcp_rz
__DEVICE__ float __frcp_rz(float __a)
Definition: __clang_cuda_device_functions.h:318

__fmul_ru
__DEVICE__ float __fmul_ru(float __a, float __b)
Definition: __clang_cuda_device_functions.h:309

__dsub_rd
__DEVICE__ double __dsub_rd(double __a, double __b)
Definition: __clang_cuda_device_functions.h:162

__frcp_ru
__DEVICE__ float __frcp_ru(float __a)
Definition: __clang_cuda_device_functions.h:317

__frcp_rd
__DEVICE__ float __frcp_rd(float __a)
Definition: __clang_cuda_device_functions.h:315

__dmul_ru
__DEVICE__ double __dmul_ru(double __a, double __b)
Definition: __clang_cuda_device_functions.h:91

__fmaf_ru
__DEVICE__ float __fmaf_ru(float __a, float __b, float __c)
Definition: __clang_cuda_device_functions.h:297

__fma_rz
__DEVICE__ double __fma_rz(double __a, double __b, double __c)
Definition: __clang_cuda_device_functions.h:276

__fma_rd
__DEVICE__ double __fma_rd(double __a, double __b, double __c)
Definition: __clang_cuda_device_functions.h:267

__dmul_rd
__DEVICE__ double __dmul_rd(double __a, double __b)
Definition: __clang_cuda_device_functions.h:85

__ddiv_ru
__DEVICE__ double __ddiv_ru(double __a, double __b)
Definition: __clang_cuda_device_functions.h:79

__ddiv_rd
__DEVICE__ double __ddiv_rd(double __a, double __b)
Definition: __clang_cuda_device_functions.h:73

__dadd_ru
__DEVICE__ double __dadd_ru(double __a, double __b)
Definition: __clang_cuda_device_functions.h:67

__fmul_rd
__DEVICE__ float __fmul_rd(float __a, float __b)
Definition: __clang_cuda_device_functions.h:303

__fsub_rd
__DEVICE__ float __fsub_rd(float __a, float __b)
Definition: __clang_cuda_device_functions.h:324

__fsub_rz
__DEVICE__ float __fsub_rz(float __a, float __b)
Definition: __clang_cuda_device_functions.h:333

__fma_ru
__DEVICE__ double __fma_ru(double __a, double __b, double __c)
Definition: __clang_cuda_device_functions.h:273

__dsqrt_ru
__DEVICE__ double __dsqrt_ru(double __a)
Definition: __clang_cuda_device_functions.h:160

__fsqrt_rz
__DEVICE__ float __fsqrt_rz(float __a)
Definition: __clang_cuda_device_functions.h:323

__dsub_rz
__DEVICE__ double __dsub_rz(double __a, double __b)
Definition: __clang_cuda_device_functions.h:171

__fadd_rd
__DEVICE__ float __fadd_rd(float __a, float __b)
Definition: __clang_cuda_device_functions.h:197

__fmul_rz
__DEVICE__ float __fmul_rz(float __a, float __b)
Definition: __clang_cuda_device_functions.h:312

__fadd_rz
__DEVICE__ float __fadd_rz(float __a, float __b)
Definition: __clang_cuda_device_functions.h:206

__dsqrt_rd
__DEVICE__ double __dsqrt_rd(double __a)
Definition: __clang_cuda_device_functions.h:158

__fmaf_rd
__DEVICE__ float __fmaf_rd(float __a, float __b, float __c)
Definition: __clang_cuda_device_functions.h:291

__dadd_rd
__DEVICE__ double __dadd_rd(double __a, double __b)
Definition: __clang_cuda_device_functions.h:61

__dsqrt_rz
__DEVICE__ double __dsqrt_rz(double __a)
Definition: __clang_cuda_device_functions.h:161

__drcp_rd
__DEVICE__ double __drcp_rd(double __a)
Definition: __clang_cuda_device_functions.h:154

__fdiv_rz
__DEVICE__ float __fdiv_rz(float __a, float __b)
Definition: __clang_cuda_device_functions.h:218

__fmaf_rz
__DEVICE__ float __fmaf_rz(float __a, float __b, float __c)
Definition: __clang_cuda_device_functions.h:300

__drcp_rz
__DEVICE__ double __drcp_rz(double __a)
Definition: __clang_cuda_device_functions.h:157

__fsub_ru
__DEVICE__ float __fsub_ru(float __a, float __b)
Definition: __clang_cuda_device_functions.h:330

__dmul_rz
__DEVICE__ double __dmul_rz(double __a, double __b)
Definition: __clang_cuda_device_functions.h:94

__fsqrt_ru
__DEVICE__ float __fsqrt_ru(float __a)
Definition: __clang_cuda_device_functions.h:322

__fadd_ru
__DEVICE__ float __fadd_ru(float __a, float __b)
Definition: __clang_cuda_device_functions.h:203

__fdiv_ru
__DEVICE__ float __fdiv_ru(float __a, float __b)
Definition: __clang_cuda_device_functions.h:215

__ddiv_rz
__DEVICE__ double __ddiv_rz(double __a, double __b)
Definition: __clang_cuda_device_functions.h:82

__dadd_rz
__DEVICE__ double __dadd_rz(double __a, double __b)
Definition: __clang_cuda_device_functions.h:70

labs
__DEVICE__ long labs(long __a)
Definition: __clang_cuda_math.h:156

llabs
__DEVICE__ long long llabs(long long __a)
Definition: __clang_cuda_math.h:162

min
__DEVICE__ int min(int __a, int __b)
Definition: __clang_cuda_math.h:201

max
__DEVICE__ int max(int __a, int __b)
Definition: __clang_cuda_math.h:200

__ocml_i0_f64
__device__ double __ocml_i0_f64(double)

__ocml_j1_f32
__device__ float __ocml_j1_f32(float)

__ocml_remquo_f64
__device__ double __ocml_remquo_f64(double, double, __attribute__((address_space(5))) int *)

__ocml_modf_f64
__device__ double __ocml_modf_f64(double, __attribute__((address_space(5))) double *)

__ocml_cospi_f32
__device__ float __ocml_cospi_f32(float)

__ocml_i0_f32
__device__ float __ocml_i0_f32(float)

__ocml_lgamma_f64
__device__ double __ocml_lgamma_f64(double)

b
__device__ __2f16 b
Definition: __clang_hip_libdevice_declares.h:303

__ocml_sincos_f32
__device__ float __ocml_sincos_f32(float, __attribute__((address_space(5))) float *)

__ocml_remquo_f32
__device__ float __ocml_remquo_f32(float, float, __attribute__((address_space(5))) int *)

__attribute__
_Float16 __2f16 __attribute__((ext_vector_type(2)))
Two-element vector of _Float16, declared with ext_vector_type(2).
Definition: __clang_hip_libdevice_declares.h:293

__ocml_y0_f32
__device__ float __ocml_y0_f32(float)

__ocml_modf_f32
__device__ float __ocml_modf_f32(float, __attribute__((address_space(5))) float *)

__ocml_i1_f32
__device__ float __ocml_i1_f32(float)

__ocml_lgamma_f32
__device__ float __ocml_lgamma_f32(float)

__ocml_sinpi_f64
__device__ double __ocml_sinpi_f64(double)

__ocml_cospi_f64
__device__ double __ocml_cospi_f64(double)

__ocml_tgamma_f64
__device__ double __ocml_tgamma_f64(double)

__ocml_tan_f32
__device__ float __ocml_tan_f32(float)

__ocml_tgamma_f32
__device__ float __ocml_tgamma_f32(float)

__ocml_sincos_f64
__device__ double __ocml_sincos_f64(double, __attribute__((address_space(5))) double *)

__ocml_sinpi_f32
__device__ float __ocml_sinpi_f32(float)

__ocml_j1_f64
__device__ double __ocml_j1_f64(double)

__ocml_y1_f64
__device__ double __ocml_y1_f64(double)

__ocml_j0_f64
__device__ double __ocml_j0_f64(double)

__ocml_cos_f32
__device__ float __ocml_cos_f32(float)

__ocml_y1_f32
__device__ float __ocml_y1_f32(float)

__ocml_j0_f32
__device__ float __ocml_j0_f32(float)

__ocml_cos_f64
__device__ double __ocml_cos_f64(double)

__ocml_i1_f64
__device__ double __ocml_i1_f64(double)

__ocml_sin_f64
__device__ double __ocml_sin_f64(double)

__ocml_sincospi_f64
__device__ double __ocml_sincospi_f64(double, __attribute__((address_space(5))) double *)

__ocml_sin_f32
__device__ float __ocml_sin_f32(float)

__ocml_sincospi_f32
__device__ float __ocml_sincospi_f32(float, __attribute__((address_space(5))) float *)

__ocml_native_sin_f32
__device__ float __ocml_native_sin_f32(float)

__ocml_native_cos_f32
__device__ float __ocml_native_cos_f32(float)

__ocml_y0_f64
__device__ double __ocml_y0_f64(double)

__ocml_tan_f64
__device__ double __ocml_tan_f64(double)

__dsub_rn
__DEVICE__ double __dsub_rn(double __x, double __y)
Definition: __clang_hip_math.h:1247

__isinff
__DEVICE__ __RETURN_TYPE __isinff(float __x)
Definition: __clang_hip_math.h:444

sinpif
__DEVICE__ float sinpif(float __x)
Definition: __clang_hip_math.h:684

tanf
__DEVICE__ float tanf(float __x)
Definition: __clang_hip_math.h:690

log2f
__DEVICE__ float log2f(float __x)
Definition: __clang_hip_math.h:495

y0f
__DEVICE__ float y0f(float __x)
Definition: __clang_hip_math.h:702

tanhf
__DEVICE__ float tanhf(float __x)
Definition: __clang_hip_math.h:693

coshf
__DEVICE__ float coshf(float __x)
Definition: __clang_hip_math.h:365

log10f
__DEVICE__ float log10f(float __x)
Definition: __clang_hip_math.h:489

j1f
__DEVICE__ float j1f(float __x)
Definition: __clang_hip_math.h:453

__finitef
__DEVICE__ __RETURN_TYPE __finitef(float __x)
Definition: __clang_hip_math.h:441

ldexpf
__DEVICE__ float ldexpf(float __x, int __e)
Definition: __clang_hip_math.h:477

llroundf
__DEVICE__ long long int llroundf(float __x)
Definition: __clang_hip_math.h:486

rhypot
__DEVICE__ double rhypot(double __x, double __y)
Definition: __clang_hip_math.h:1015

normcdfinv
__DEVICE__ double normcdfinv(double __x)
Definition: __clang_hip_math.h:985

norm3d
__DEVICE__ double norm3d(double __x, double __y, double __z)
Definition: __clang_hip_math.h:972

truncf
__DEVICE__ float truncf(float __x)
Definition: __clang_hip_math.h:699

remainderf
__DEVICE__ float remainderf(float __x, float __y)
Definition: __clang_hip_math.h:588

fabsf
__DEVICE__ float fabsf(float __x)
Definition: __clang_hip_math.h:404

__fdiv_rn
__DEVICE__ float __fdiv_rn(float __x, float __y)
Definition: __clang_hip_math.h:197

scalbnf
__DEVICE__ float scalbnf(float __x, int __n)
Definition: __clang_hip_math.h:646

cyl_bessel_i0f
__DEVICE__ float cyl_bessel_i0f(float __x)
Definition: __clang_hip_math.h:371

nanf
__DEVICE__ float nanf(const char *__tagp __attribute__((nonnull)))
Definition: __clang_hip_math.h:522

lgammaf
__DEVICE__ float lgammaf(float __x)
Definition: __clang_hip_math.h:480

cospif
__DEVICE__ float cospif(float __x)
Definition: __clang_hip_math.h:368

__signbitf
__DEVICE__ __RETURN_TYPE __signbitf(float __x)
Definition: __clang_hip_math.h:649

__dsqrt_rn
__DEVICE__ double __dsqrt_rn(double __x)
Definition: __clang_hip_math.h:1225

frexpf
__DEVICE__ float frexpf(float __x, int *__nptr)
Definition: __clang_hip_math.h:430

tgammaf
__DEVICE__ float tgammaf(float __x)
Definition: __clang_hip_math.h:696

__sinf
__DEVICE__ float __sinf(float __x)
Definition: __clang_hip_math.h:308

erfinvf
__DEVICE__ float erfinvf(float __x)
Definition: __clang_hip_math.h:389

modff
__DEVICE__ float modff(float __x, float *__iptr)
Definition: __clang_hip_math.h:510

erfinv
__DEVICE__ double erfinv(double __x)
Definition: __clang_hip_math.h:793

expm1f
__DEVICE__ float expm1f(float __x)
Definition: __clang_hip_math.h:401

sinhf
__DEVICE__ float sinhf(float __x)
Definition: __clang_hip_math.h:681

j0
__DEVICE__ double j0(double __x)
Definition: __clang_hip_math.h:851

y1f
__DEVICE__ float y1f(float __x)
Definition: __clang_hip_math.h:705

acosf
__DEVICE__ float acosf(float __x)
Definition: __clang_hip_math.h:332

fmaf
__DEVICE__ float fmaf(float __x, float __y, float __z)
Definition: __clang_hip_math.h:416

cyl_bessel_i1f
__DEVICE__ float cyl_bessel_i1f(float __x)
Definition: __clang_hip_math.h:374

fmodf
__DEVICE__ float fmodf(float __x, float __y)
Definition: __clang_hip_math.h:427

log1pf
__DEVICE__ float log1pf(float __x)
Definition: __clang_hip_math.h:492

atan2f
__DEVICE__ float atan2f(float __x, float __y)
Definition: __clang_hip_math.h:344

copysignf
__DEVICE__ float copysignf(float __x, float __y)
Definition: __clang_hip_math.h:359

j1
__DEVICE__ double j1(double __x)
Definition: __clang_hip_math.h:854

__isnan
__DEVICE__ __RETURN_TYPE __isnan(double __x)
Definition: __clang_hip_math.h:848

rnormf
__DEVICE__ float rnormf(int __dim, const float *__a)
Definition: __clang_hip_math.h:622

rnorm4df
__DEVICE__ float rnorm4df(float __x, float __y, float __z, float __w)
Definition: __clang_hip_math.h:617

__cosf
__DEVICE__ float __cosf(float __x)
Definition: __clang_hip_math.h:158

erff
__DEVICE__ float erff(float __x)
Definition: __clang_hip_math.h:386

atanf
__DEVICE__ float atanf(float __x)
Definition: __clang_hip_math.h:347

rnorm3df
__DEVICE__ float rnorm3df(float __x, float __y, float __z)
Definition: __clang_hip_math.h:612

norm
__DEVICE__ double norm(int __dim, const double *__a)
Definition: __clang_hip_math.h:960

erfcxf
__DEVICE__ float erfcxf(float __x)
Definition: __clang_hip_math.h:383

erfcinvf
__DEVICE__ float erfcinvf(float __x)
Definition: __clang_hip_math.h:380

asinf
__DEVICE__ float asinf(float __x)
Definition: __clang_hip_math.h:338

lroundf
__DEVICE__ long int lroundf(float __x)
Definition: __clang_hip_math.h:507

__fdividef
__DEVICE__ float __fdividef(float __x, float __y)
Definition: __clang_hip_math.h:201

__frsqrt_rn
__DEVICE__ float __frsqrt_rn(float __x)
Definition: __clang_hip_math.h:256

__log2f
__DEVICE__ float __log2f(float __x)
Definition: __clang_hip_math.h:290

norm4df
__DEVICE__ float norm4df(float __x, float __y, float __z, float __w)
Definition: __clang_hip_math.h:556

__isnanf
__DEVICE__ __RETURN_TYPE __isnanf(float __x)
Definition: __clang_hip_math.h:447

__make_mantissa_base10
__DEVICE__ uint64_t __make_mantissa_base10(const char *__tagp __attribute__((nonnull)))
Definition: __clang_hip_math.h:102

jn
__DEVICE__ double jn(int __n, double __x)
Definition: __clang_hip_math.h:857

__exp10f
__DEVICE__ float __exp10f(float __x)
Definition: __clang_hip_math.h:161

__frcp_rn
__DEVICE__ float __frcp_rn(float __x)
Definition: __clang_hip_math.h:252

__DEVICE__
#define __DEVICE__
Definition: __clang_hip_math.h:33

ynf
__DEVICE__ float ynf(int __n, float __x)
Definition: __clang_hip_math.h:708

powf
__DEVICE__ float powf(float __x, float __y)
Definition: __clang_hip_math.h:579

__fsub_rn
__DEVICE__ float __fsub_rn(float __x, float __y)
Definition: __clang_hip_math.h:283

__dadd_rn
__DEVICE__ double __dadd_rn(double __x, double __y)
Definition: __clang_hip_math.h:1153

sinf
__DEVICE__ float sinf(float __x)
Definition: __clang_hip_math.h:678

__tanf
__DEVICE__ float __tanf(float __x)
Definition: __clang_hip_math.h:311

remquof
__DEVICE__ float remquof(float __x, float __y, int *__quo)
Definition: __clang_hip_math.h:593

normcdf
__DEVICE__ double normcdf(double __x)
Definition: __clang_hip_math.h:982

__fsqrt_rn
__DEVICE__ float __fsqrt_rn(float __x)
Definition: __clang_hip_math.h:269

hypotf
__DEVICE__ float hypotf(float __x, float __y)
Definition: __clang_hip_math.h:435

__fmaf_rn
__DEVICE__ float __fmaf_rn(float __x, float __y, float __z)
Definition: __clang_hip_math.h:222

sincosf
__DEVICE__ void sincosf(float __x, float *__sinptr, float *__cosptr)
Definition: __clang_hip_math.h:652

__make_mantissa_base8
__DEVICE__ uint64_t __make_mantissa_base8(const char *__tagp __attribute__((nonnull)))
Definition: __clang_hip_math.h:85

exp10f
__DEVICE__ float exp10f(float __x)
Definition: __clang_hip_math.h:392

y1
__DEVICE__ double y1(double __x)
Definition: __clang_hip_math.h:1109

__FAST_OR_SLOW
#define __FAST_OR_SLOW(fast, slow)
Definition: __clang_hip_math.h:44

fmaxf
__DEVICE__ float fmaxf(float __x, float __y)
Definition: __clang_hip_math.h:421

fminf
__DEVICE__ float fminf(float __x, float __y)
Definition: __clang_hip_math.h:424

erfcinv
__DEVICE__ double erfcinv(double __x)
Definition: __clang_hip_math.h:787

powi
__DEVICE__ double powi(double __x, int __y)
Definition: __clang_hip_math.h:991

logf
__DEVICE__ float logf(float __x)
Definition: __clang_hip_math.h:501

__fadd_rn
__DEVICE__ float __fadd_rn(float __x, float __y)
Definition: __clang_hip_math.h:183

cospi
__DEVICE__ double cospi(double __x)
Definition: __clang_hip_math.h:772

rsqrt
__DEVICE__ double rsqrt(double __x)
Definition: __clang_hip_math.h:1046

erfcf
__DEVICE__ float erfcf(float __x)
Definition: __clang_hip_math.h:377

atanhf
__DEVICE__ float atanhf(float __x)
Definition: __clang_hip_math.h:350

asinhf
__DEVICE__ float asinhf(float __x)
Definition: __clang_hip_math.h:341

__expf
__DEVICE__ float __expf(float __x)
Definition: __clang_hip_math.h:167

norm4d
__DEVICE__ double norm4d(double __x, double __y, double __z, double __w)
Definition: __clang_hip_math.h:977

__RETURN_TYPE
#define __RETURN_TYPE
Definition: __clang_hip_math.h:55

__logf
__DEVICE__ float __logf(float __x)
Definition: __clang_hip_math.h:293

__fma_rn
__DEVICE__ double __fma_rn(double __x, double __y, double __z)
Definition: __clang_hip_math.h:1269

nan
__DEVICE__ double nan(const char *__tagp)
Definition: __clang_hip_math.h:924

rnorm
__DEVICE__ double rnorm(int __dim, const double *__a)
Definition: __clang_hip_math.h:1021

j0f
__DEVICE__ float j0f(float __x)
Definition: __clang_hip_math.h:450

rsqrtf
__DEVICE__ float rsqrtf(float __x)
Definition: __clang_hip_math.h:637

jnf
__DEVICE__ float jnf(int __n, float __x)
Definition: __clang_hip_math.h:456

sinpi
__DEVICE__ double sinpi(double __x)
Definition: __clang_hip_math.h:1088

logbf
__DEVICE__ float logbf(float __x)
Definition: __clang_hip_math.h:498

y0
__DEVICE__ double y0(double __x)
Definition: __clang_hip_math.h:1106

__finite
__DEVICE__ __RETURN_TYPE __finite(double __x)
Definition: __clang_hip_math.h:842

__sincosf
__DEVICE__ void __sincosf(float __x, float *__sinptr, float *__cosptr)
Definition: __clang_hip_math.h:302

yn
__DEVICE__ double yn(int __n, double __x)
Definition: __clang_hip_math.h:1112

rhypotf
__DEVICE__ float rhypotf(float __x, float __y)
Definition: __clang_hip_math.h:606

exp2f
__DEVICE__ float exp2f(float __x)
Definition: __clang_hip_math.h:395

cyl_bessel_i0
__DEVICE__ double cyl_bessel_i0(double __x)
Definition: __clang_hip_math.h:775

powif
__DEVICE__ float powif(float __x, int __y)
Definition: __clang_hip_math.h:582

__ddiv_rn
__DEVICE__ double __ddiv_rn(double __x, double __y)
Definition: __clang_hip_math.h:1175

cyl_bessel_i1
__DEVICE__ double cyl_bessel_i1(double __x)
Definition: __clang_hip_math.h:778

ceilf
__DEVICE__ float ceilf(float __x)
Definition: __clang_hip_math.h:356

rcbrt
__DEVICE__ double rcbrt(double __x)
Definition: __clang_hip_math.h:994

rnorm3d
__DEVICE__ double rnorm3d(double __x, double __y, double __z)
Definition: __clang_hip_math.h:1033

normcdfinvf
__DEVICE__ float normcdfinvf(float __x)
Definition: __clang_hip_math.h:564

norm3df
__DEVICE__ float norm3df(float __x, float __y, float __z)
Definition: __clang_hip_math.h:551

sincos
__DEVICE__ void sincos(double __x, double *__sinptr, double *__cosptr)
Definition: __clang_hip_math.h:1063

__static_assert_type_size_equal
#define __static_assert_type_size_equal(A, B)
Definition: __clang_hip_math.h:79

__signbit
__DEVICE__ __RETURN_TYPE __signbit(double __x)
Definition: __clang_hip_math.h:1057

fdimf
__DEVICE__ float fdimf(float __x, float __y)
Definition: __clang_hip_math.h:407

__dmul_rn
__DEVICE__ double __dmul_rn(double __x, double __y)
Definition: __clang_hip_math.h:1197

normf
__DEVICE__ float normf(int __dim, const float *__a)
Definition: __clang_hip_math.h:567

nearbyintf
__DEVICE__ float nearbyintf(float __x)
Definition: __clang_hip_math.h:543

__make_mantissa
__DEVICE__ uint64_t __make_mantissa(const char *__tagp __attribute__((nonnull)))
Definition: __clang_hip_math.h:140

ilogbf
__DEVICE__ int ilogbf(float __x)
Definition: __clang_hip_math.h:438

floorf
__DEVICE__ float floorf(float __x)
Definition: __clang_hip_math.h:413

sqrtf
__DEVICE__ float sqrtf(float __x)
Definition: __clang_hip_math.h:687

roundf
__DEVICE__ float roundf(float __x)
Definition: __clang_hip_math.h:634

sincospif
__DEVICE__ void sincospif(float __x, float *__sinptr, float *__cosptr)
Definition: __clang_hip_math.h:667

__drcp_rn
__DEVICE__ double __drcp_rn(double __x)
Definition: __clang_hip_math.h:1211

lrintf
__DEVICE__ long int lrintf(float __x)
Definition: __clang_hip_math.h:504

acoshf
__DEVICE__ float acoshf(float __x)
Definition: __clang_hip_math.h:335

modf
__DEVICE__ double modf(double __x, double *__iptr)
Definition: __clang_hip_math.h:911

cosf
__DEVICE__ float cosf(float __x)
Definition: __clang_hip_math.h:362

expf
__DEVICE__ float expf(float __x)
Definition: __clang_hip_math.h:398

nextafterf
__DEVICE__ float nextafterf(float __x, float __y)
Definition: __clang_hip_math.h:546

rnorm4d
__DEVICE__ double rnorm4d(double __x, double __y, double __z, double __w)
Definition: __clang_hip_math.h:1038

llrintf
__DEVICE__ long long int llrintf(float __x)
Definition: __clang_hip_math.h:483

erfcx
__DEVICE__ double erfcx(double __x)
Definition: __clang_hip_math.h:790

fdividef
__DEVICE__ float fdividef(float __x, float __y)
Definition: __clang_hip_math.h:410

rcbrtf
__DEVICE__ float rcbrtf(float __x)
Definition: __clang_hip_math.h:585

exp10
__DEVICE__ double exp10(double __x)
Definition: __clang_hip_math.h:799

__log10f
__DEVICE__ float __log10f(float __x)
Definition: __clang_hip_math.h:287

cbrtf
__DEVICE__ float cbrtf(float __x)
Definition: __clang_hip_math.h:353

__fmul_rn
__DEVICE__ float __fmul_rn(float __x, float __y)
Definition: __clang_hip_math.h:238

sincospi
__DEVICE__ void sincospi(double __x, double *__sinptr, double *__cosptr)
Definition: __clang_hip_math.h:1074

scalblnf
__DEVICE__ float scalblnf(float __x, long int __n)
Definition: __clang_hip_math.h:640

__isinf
__DEVICE__ __RETURN_TYPE __isinf(double __x)
Definition: __clang_hip_math.h:845

rintf
__DEVICE__ float rintf(float __x)
Definition: __clang_hip_math.h:609

normcdff
__DEVICE__ float normcdff(float __x)
Definition: __clang_hip_math.h:561

__make_mantissa_base16
__DEVICE__ uint64_t __make_mantissa_base16(const char *__tagp __attribute__((nonnull)))
Definition: __clang_hip_math.h:119

__saturatef
__DEVICE__ float __saturatef(float __x)
Definition: __clang_hip_math.h:299

__powf
__DEVICE__ float __powf(float __x, float __y)
Definition: __clang_hip_math.h:296

__host__
#define __host__
Definition: __llvm_offload.h:12

__device__
#define __device__
Definition: __llvm_offload.h:13

__y
static __inline__ uint32_t uint32_t __y
Definition: arm_acle.h:130

__a
static __inline__ void int __a
Definition: emmintrin.h:4079

limits.h

INT_MAX
#define INT_MAX
Definition: limits.h:50

clang::T
const FunctionProtoType * T
Definition: RecursiveASTVisitor.h:1364

sign
float __ovld __cnfn sign(float)
Returns 1.0 if x > 0, -0.0 if x = -0.0, +0.0 if x = +0.0, or -1.0 if x < 0.

true
#define true
Definition: stdbool.h:25

stdint.h

sinh
#define sinh(__x)
Definition: tgmath.h:373

asin
#define asin(__x)
Definition: tgmath.h:112

scalbln
#define scalbln(__x, __y)
Definition: tgmath.h:1182

sqrt
#define sqrt(__x)
Definition: tgmath.h:520

acos
#define acos(__x)
Definition: tgmath.h:83

fmin
#define fmin(__x, __y)
Definition: tgmath.h:780

exp
#define exp(__x)
Definition: tgmath.h:431

ilogb
#define ilogb(__x)
Definition: tgmath.h:851

copysign
#define copysign(__x, __y)
Definition: tgmath.h:618

erf
#define erf(__x)
Definition: tgmath.h:636

atanh
#define atanh(__x)
Definition: tgmath.h:228

remquo
#define remquo(__x, __y, __z)
Definition: tgmath.h:1111

nextafter
#define nextafter(__x, __y)
Definition: tgmath.h:1055

frexp
#define frexp(__x, __y)
Definition: tgmath.h:816

asinh
#define asinh(__x)
Definition: tgmath.h:199

erfc
#define erfc(__x)
Definition: tgmath.h:653

atan2
#define atan2(__x, __y)
Definition: tgmath.h:566

hypot
#define hypot(__x, __y)
Definition: tgmath.h:833

exp2
#define exp2(__x)
Definition: tgmath.h:670

sin
#define sin(__x)
Definition: tgmath.h:286

cbrt
#define cbrt(__x)
Definition: tgmath.h:584

log2
#define log2(__x)
Definition: tgmath.h:970

llround
#define llround(__x)
Definition: tgmath.h:919

cosh
#define cosh(__x)
Definition: tgmath.h:344

trunc
#define trunc(__x)
Definition: tgmath.h:1216

fmax
#define fmax(__x, __y)
Definition: tgmath.h:762

ldexp
#define ldexp(__x, __y)
Definition: tgmath.h:868

acosh
#define acosh(__x)
Definition: tgmath.h:170

tgamma
#define tgamma(__x)
Definition: tgmath.h:1199

scalbn
#define scalbn(__x, __y)
Definition: tgmath.h:1165

round
#define round(__x)
Definition: tgmath.h:1148

fmod
#define fmod(__x, __y)
Definition: tgmath.h:798

llrint
#define llrint(__x)
Definition: tgmath.h:902

tan
#define tan(__x)
Definition: tgmath.h:315

cos
#define cos(__x)
Definition: tgmath.h:257

log10
#define log10(__x)
Definition: tgmath.h:936

fabs
#define fabs(__x)
Definition: tgmath.h:549

pow
#define pow(__x, __y)
Definition: tgmath.h:490

log1p
#define log1p(__x)
Definition: tgmath.h:953

rint
#define rint(__x)
Definition: tgmath.h:1131

expm1
#define expm1(__x)
Definition: tgmath.h:687

remainder
#define remainder(__x, __y)
Definition: tgmath.h:1090

fdim
#define fdim(__x, __y)
Definition: tgmath.h:704

lgamma
#define lgamma(__x)
Definition: tgmath.h:885

tanh
#define tanh(__x)
Definition: tgmath.h:402

lrint
#define lrint(__x)
Definition: tgmath.h:1004

atan
#define atan(__x)
Definition: tgmath.h:141

floor
#define floor(__x)
Definition: tgmath.h:722

ceil
#define ceil(__x)
Definition: tgmath.h:601

log
#define log(__x)
Definition: tgmath.h:460

logb
#define logb(__x)
Definition: tgmath.h:987

nearbyint
#define nearbyint(__x)
Definition: tgmath.h:1038

lround
#define lround(__x)
Definition: tgmath.h:1021

fma
#define fma(__x, __y, __z)
Definition: tgmath.h:742