// MIT License // // Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in all // copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE // SOFTWARE. #ifndef HIPCUB_TEST_HIPCUB_TEST_UTILS_DATA_GENERATION_HPP_ #define HIPCUB_TEST_HIPCUB_TEST_UTILS_DATA_GENERATION_HPP_ // Std::memcpy and std::memcmp #include #include "test_utils_half.hpp" #include "test_utils_bfloat16.hpp" #include "test_utils_custom_test_types.hpp" namespace test_utils { // Numeric limits which also supports custom_test_type classes template struct numeric_limits : std::numeric_limits { }; template<> struct numeric_limits : public std::numeric_limits { public: using T = test_utils::half; static inline T min() { return T(0.00006104f); }; static inline T max() { return T(65504.0f); }; static inline T lowest() { return T(-65504.0f); }; static inline T infinity() { return T(std::numeric_limits::infinity()); }; static inline T quiet_NaN() { return T(std::numeric_limits::quiet_NaN()); }; static inline T signaling_NaN() { return T(std::numeric_limits::signaling_NaN()); }; }; template<> class numeric_limits : public std::numeric_limits { public: using T = test_utils::bfloat16; static inline T max() { return T(3.38953138925e+38f); }; static inline T min() { return T(std::numeric_limits::min()); }; static inline T lowest() { return T(-3.38953138925e+38f); }; static inline T infinity() { return T(std::numeric_limits::infinity()); }; static inline T quiet_NaN() { return T(std::numeric_limits::quiet_NaN()); }; static inline T signaling_NaN() { return T(std::numeric_limits::signaling_NaN()); }; }; // End of extended numeric_limits // Helper class to generate a vector of special values for any type template struct special_values { private: // sign_bit_flip needed because host-side operators for __half are missing. (e.g. -__half unary operator or (-1*) __half*__half binary operator static T sign_bit_flip(T value){ uint8_t* data = reinterpret_cast(&value); data[sizeof(T)-1] ^= 0x80; return value; } public: static std::vector vector(){ if(std::is_integral::value){ return std::vector(); }else { std::vector r = {test_utils::numeric_limits::quiet_NaN(), //sign_bit_flip(test_utils::numeric_limits::quiet_NaN()), // TODO: fix AMD issue with -NaN //test_utils::numeric_limits::signaling_NaN(), // signaling_NaN not supported on NVIDIA yet //sign_bit_flip(test_utils::numeric_limits::signaling_NaN()), test_utils::numeric_limits::infinity(), sign_bit_flip(test_utils::numeric_limits::infinity()), T(0.0), T(-0.0)}; return r; } } }; // end of special_values helpers /// Insert special values of type T at a random place in the source vector /// \tparam T /// \param source The source vector to modify template void add_special_values(std::vector& source, int seed_value) { std::default_random_engine gen(seed_value); std::vector special_values = test_utils::special_values::vector(); if(source.size() > special_values.size()) { unsigned int start = gen() % (source.size() - special_values.size()); std::copy(special_values.begin(), special_values.end(), source.begin() + start); } } // std::uniform_int_distribution is undefined for anything other than // short, int, long, long long, unsigned short, unsigned int, unsigned long, or unsigned long long. // Actually causes problems with signed/unsigned char on Windows using clang. template struct is_valid_for_int_distribution : std::integral_constant::value || std::is_same::value || std::is_same::value || std::is_same::value || std::is_same::value || std::is_same::value || std::is_same::value || std::is_same::value > {}; template inline auto get_random_data(size_t size, T min, T max, int seed_value) -> typename std::enable_if::value, std::vector>::type { std::default_random_engine gen(seed_value); using dis_type = typename std::conditional< is_valid_for_int_distribution::value, T, typename std::conditional::value, int, unsigned int>::type >::type; std::uniform_int_distribution distribution(static_cast(min), static_cast(max)); std::vector data(size); std::generate(data.begin(), data.end(), [&]() { return distribution(gen); }); return data; } template inline auto get_random_data(size_t size, S min, U max, int seed_value) -> typename std::enable_if::value && !is_custom_test_type::value, std::vector>::type { std::default_random_engine gen(seed_value); using dis_type = typename std::conditional::value || std::is_same::value, float, T>::type; std::uniform_real_distribution distribution(static_cast(min), static_cast(max)); std::vector data(size); std::generate( data.begin(), data.end(), [&]() { return static_cast(distribution(gen)); } ); return data; } template inline auto get_random_data(size_t size, typename T::value_type min, typename T::value_type max, int seed_value) -> typename std::enable_if< is_custom_test_type::value && std::is_integral::value, std::vector >::type { std::default_random_engine gen(seed_value); using dis_type = typename std::conditional< is_valid_for_int_distribution::value, typename T::value_type, typename std::conditional::value, int, unsigned int>::type >::type; std::uniform_int_distribution distribution(static_cast(min), static_cast(max)); std::vector data(size); std::generate(data.begin(), data.end(), [&]() { return T(distribution(gen), distribution(gen)); }); return data; } template inline auto get_random_data(size_t size, typename T::value_type min, typename T::value_type max, int seed_value) -> typename std::enable_if< is_custom_test_type::value && std::is_floating_point::value, std::vector >::type { std::default_random_engine gen(seed_value); std::uniform_real_distribution distribution(min, max); std::vector data(size); std::generate(data.begin(), data.end(), [&]() { return T(distribution(gen), distribution(gen)); }); return data; } template inline auto get_random_value(T min, T max, int seed_value) -> typename std::enable_if::value, T>::type { return get_random_data(1, min, max, seed_value)[0]; } template inline std::vector get_random_data01(size_t size, float p, int seed_value) { const size_t max_random_size = 1024 * 1024; std::default_random_engine gen(seed_value); std::bernoulli_distribution distribution(p); std::vector data(size); std::generate( data.begin(), data.begin() + std::min(size, max_random_size), [&]() { return distribution(gen); } ); for(size_t i = max_random_size; i < size; i += max_random_size) { std::copy_n(data.begin(), std::min(size - i, max_random_size), data.begin() + i); } return data; } } // end test_utils namespace #endif // HIPCUB_TEST_HIPCUB_TEST_UTILS_DATA_GENERATION_HPP_