/* ************************************************************************ * Copyright 2018-2019 Advanced Micro Devices, Inc. * ************************************************************************ */ #ifndef ROCBLAS_MATH_H_ #define ROCBLAS_MATH_H_ #include "rocblas.h" #include #include #include #include /* ============================================================================================ */ // Helper function to truncate float to bfloat16 inline __host__ rocblas_bfloat16 float_to_bfloat16_truncate(float val) { union { float fp32; uint32_t int32; } u = {val}; rocblas_bfloat16 ret; ret.data = uint16_t(u.int32 >> 16); if((u.int32 & 0x7fff0000) == 0x7f800000 && u.int32 & 0xffff) ret.data |= 1; // Preserve signaling NaN return ret; } /* ============================================================================================ */ /*! \brief returns true if value is NaN */ template {}, int>::type = 0> inline bool rocblas_isnan(T) { return false; } template {} && !is_complex, int>::type = 0> inline bool rocblas_isnan(T arg) { return std::isnan(arg); } template , int>::type = 0> inline bool rocblas_isnan(const T& arg) { return rocblas_isnan(std::real(arg)) || rocblas_isnan(std::imag(arg)); } inline bool rocblas_isnan(rocblas_half arg) { union { rocblas_half fp; uint16_t data; } x = {arg}; return (~x.data & 0x7c00) == 0 && (x.data & 0x3ff) != 0; } /* ============================================================================================ */ /*! \brief negate a value */ template inline T negate(T x) { return -x; } template <> inline rocblas_half negate(rocblas_half arg) { union { rocblas_half fp; uint16_t data; } x = {arg}; x.data ^= 0x8000; return x.fp; } template <> inline rocblas_bfloat16 negate(rocblas_bfloat16 x) { x.data ^= 0x8000; return x; } #endif