// Copyright (c) 2018 Advanced Micro Devices, Inc. All rights reserved. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in // all copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN // THE SOFTWARE. #ifndef ROCPRIM_TEST_TEST_UTILS_HPP_ #define ROCPRIM_TEST_TEST_UTILS_HPP_ #include #include #include #include #include // hipCUB #include namespace test_utils { template inline auto get_random_data(size_t size, T min, T max) -> typename std::enable_if::value, std::vector>::type { std::random_device rd; std::default_random_engine gen(rd()); std::uniform_int_distribution distribution(min, max); std::vector data(size); std::generate(data.begin(), data.end(), [&]() { return distribution(gen); }); return data; } template inline auto get_random_data(size_t size, T min, T max) -> typename std::enable_if::value, std::vector>::type { std::random_device rd; std::default_random_engine gen(rd()); std::uniform_real_distribution distribution(min, max); std::vector data(size); std::generate(data.begin(), data.end(), [&]() { return distribution(gen); }); return data; } template inline std::vector get_random_data01(size_t size, float p) { const size_t max_random_size = 1024 * 1024; std::random_device rd; std::default_random_engine gen(rd()); std::bernoulli_distribution distribution(p); std::vector data(size); std::generate( data.begin(), data.begin() + std::min(size, max_random_size), [&]() { return distribution(gen); } ); for(size_t i = max_random_size; i < size; i += max_random_size) { std::copy_n(data.begin(), std::min(size - i, max_random_size), data.begin() + i); } return data; } template inline auto get_random_value(T min, T max) -> typename std::enable_if::value, T>::type { return get_random_data(1, min, max)[0]; } // Can't use std::prefix_sum for inclusive/exclusive scan, because // it does not handle short[] -> int(int a, int b) { a + b; } -> int[] // they way we expect. That's because sum in std::prefix_sum's implementation // is of type typename std::iterator_traits::value_type (short) template OutputIt host_inclusive_scan(InputIt first, InputIt last, OutputIt d_first, BinaryOperation op) { using input_type = typename std::iterator_traits::value_type; using output_type = typename std::iterator_traits::value_type; using result_type = typename std::conditional< std::is_void::value, input_type, output_type >::type; if (first == last) return d_first; result_type sum = *first; *d_first = sum; while (++first != last) { sum = op(sum, static_cast(*first)); *++d_first = sum; } return ++d_first; } template OutputIt host_exclusive_scan(InputIt first, InputIt last, T initial_value, OutputIt d_first, BinaryOperation op) { using input_type = typename std::iterator_traits::value_type; using output_type = typename std::iterator_traits::value_type; using result_type = typename std::conditional< std::is_void::value, input_type, output_type >::type; if (first == last) return d_first; result_type sum = initial_value; *d_first = initial_value; while ((first+1) != last) { sum = op(sum, static_cast(*first)); *++d_first = sum; first++; } return ++d_first; } template OutputIt host_exclusive_scan_by_key(InputIt first, InputIt last, KeyIt k_first, T initial_value, OutputIt d_first, BinaryOperation op, KeyCompare key_compare_op) { using input_type = typename std::iterator_traits::value_type; using output_type = typename std::iterator_traits::value_type; using result_type = typename std::conditional< std::is_void::value, input_type, output_type >::type; if (first == last) return d_first; result_type sum = initial_value; *d_first = initial_value; while ((first+1) != last) { if(key_compare_op(*k_first, *++k_first)) { sum = op(sum, static_cast(*first)); } else { sum = initial_value; } *++d_first = sum; first++; } return ++d_first; } HIPCUB_HOST_DEVICE inline constexpr unsigned int warp_size() { return HIPCUB_WARP_THREADS; } template HIPCUB_HOST_DEVICE inline constexpr T max(const T& a, const T& b) { return a < b ? b : a; } template HIPCUB_HOST_DEVICE inline constexpr T min(const T& a, const T& b) { return a < b ? a : b; } template HIPCUB_HOST_DEVICE inline constexpr bool is_power_of_two(const T x) { static_assert(std::is_integral::value, "T must be integer type"); return (x > 0) && ((x & (x - 1)) == 0); } template HIPCUB_HOST_DEVICE inline constexpr T next_power_of_two(const T x, const T acc = 1) { static_assert(std::is_unsigned::value, "T must be unsigned type"); return acc >= x ? acc : next_power_of_two(x, 2 * acc); } // Return thread id in a "logical warp", which can be smaller than a hardware warp size. template HIPCUB_DEVICE inline auto logical_lane_id() -> typename std::enable_if::type { return hipcub::LaneId() & (LogicalWarpSize-1); // same as land_id()%WarpSize } template HIPCUB_DEVICE inline auto logical_lane_id() -> typename std::enable_if::type { return hipcub::LaneId()%LogicalWarpSize; } template<> HIPCUB_DEVICE inline unsigned int logical_lane_id() { return hipcub::LaneId(); } // Return id of "logical warp" in a block template HIPCUB_DEVICE inline unsigned int logical_warp_id() { return hipcub::RowMajorTid(1, 1, 1)/LogicalWarpSize; } template<> HIPCUB_DEVICE inline unsigned int logical_warp_id() { return hipcub::WarpId(); } inline size_t get_max_block_size() { hipDeviceProp_t device_properties; hipError_t error = hipGetDeviceProperties(&device_properties, 0); if(error != hipSuccess) { std::cout << "HIP error: " << error << " file: " << __FILE__ << " line: " << __LINE__ << std::endl; std::exit(error); } return device_properties.maxThreadsPerBlock; } // Select the minimal warp size for block of size block_size, it's // useful for blocks smaller than maximal warp size. template HIPCUB_HOST_DEVICE inline constexpr T get_min_warp_size(const T block_size, const T max_warp_size) { static_assert(std::is_unsigned::value, "T must be unsigned type"); return block_size >= max_warp_size ? max_warp_size : next_power_of_two(block_size); } template struct custom_test_type { using value_type = T; T x; T y; HIPCUB_HOST_DEVICE inline constexpr custom_test_type() {} HIPCUB_HOST_DEVICE inline constexpr custom_test_type(T x, T y) : x(x), y(y) {} HIPCUB_HOST_DEVICE inline constexpr custom_test_type(T xy) : x(xy), y(xy) {} template HIPCUB_HOST_DEVICE inline custom_test_type(const custom_test_type& other) { x = other.x; y = other.y; } #ifndef HIPCUB_CUB_API HIPCUB_HOST_DEVICE inline ~custom_test_type() = default; #endif HIPCUB_HOST_DEVICE inline custom_test_type& operator=(const custom_test_type& other) { x = other.x; y = other.y; return *this; } HIPCUB_HOST_DEVICE inline custom_test_type operator+(const custom_test_type& other) const { return custom_test_type(x + other.x, y + other.y); } HIPCUB_HOST_DEVICE inline custom_test_type operator-(const custom_test_type& other) const { return custom_test_type(x - other.x, y - other.y); } HIPCUB_HOST_DEVICE inline bool operator<(const custom_test_type& other) const { return (x < other.x || (x == other.x && y < other.y)); } HIPCUB_HOST_DEVICE inline bool operator>(const custom_test_type& other) const { return (x > other.x || (x == other.x && y > other.y)); } HIPCUB_HOST_DEVICE inline bool operator==(const custom_test_type& other) const { return (x == other.x && y == other.y); } HIPCUB_HOST_DEVICE inline bool operator!=(const custom_test_type& other) const { return !(*this == other); } }; template struct is_custom_test_type : std::false_type { }; template struct is_custom_test_type> : std::true_type { }; template inline auto get_random_data(size_t size, typename T::value_type min, typename T::value_type max) -> typename std::enable_if< is_custom_test_type::value && std::is_integral::value, std::vector >::type { std::random_device rd; std::default_random_engine gen(rd()); std::uniform_int_distribution distribution(min, max); std::vector data(size); std::generate(data.begin(), data.end(), [&]() { return T(distribution(gen), distribution(gen)); }); return data; } template inline auto get_random_data(size_t size, typename T::value_type min, typename T::value_type max) -> typename std::enable_if< is_custom_test_type::value && std::is_floating_point::value, std::vector >::type { std::random_device rd; std::default_random_engine gen(rd()); std::uniform_real_distribution distribution(min, max); std::vector data(size); std::generate(data.begin(), data.end(), [&]() { return T(distribution(gen), distribution(gen)); }); return data; } template auto assert_near(const std::vector& result, const std::vector& expected, const float percent) -> typename std::enable_if::value && std::is_arithmetic::value>::type { ASSERT_EQ(result.size(), expected.size()); for(size_t i = 0; i < result.size(); i++) { auto diff = std::max(std::abs(percent * expected[i]), T(percent)); if(std::is_integral::value) diff = 0; ASSERT_NEAR(result[i], expected[i], diff) << "where index = " << i; } } template auto assert_near(const T& result, const T& expected, const float percent) -> typename std::enable_if::value && std::is_arithmetic::value>::type { auto diff = std::max(std::abs(percent * expected), T(percent)); if(std::is_integral::value) diff = 0; ASSERT_NEAR(result, expected, diff); } template auto assert_near(const T& result, const T& expected, const float percent) -> typename std::enable_if::value>::type { using value_type = typename T::value_type; auto diff1 = std::max(std::abs(percent * expected.x), value_type(percent)); auto diff2 = std::max(std::abs(percent * expected.y), value_type(percent)); if(std::is_integral::value) { diff1 = 0; diff2 = 0; } ASSERT_NEAR(result.x, expected.x, diff1); ASSERT_NEAR(result.y, expected.y, diff2); } template auto assert_near(const std::vector& result, const std::vector& expected, const float percent) -> typename std::enable_if::value>::type { using value_type = typename T::value_type; ASSERT_EQ(result.size(), expected.size()); for(size_t i = 0; i < result.size(); i++) { auto diff1 = std::max(std::abs(percent * expected[i].x), value_type(percent)); auto diff2 = std::max(std::abs(percent * expected[i].y), value_type(percent)); if(std::is_integral::value) { diff1 = 0; diff2 = 0; } ASSERT_NEAR(result[i].x, expected[i].x, diff1) << "where index = " << i; ASSERT_NEAR(result[i].y, expected[i].y, diff2) << "where index = " << i; } } template auto assert_near(const std::vector& result, const std::vector& expected, const float) -> typename std::enable_if::value && !std::is_arithmetic::value>::type { ASSERT_EQ(result.size(), expected.size()); for(size_t i = 0; i < result.size(); i++) { ASSERT_EQ(result[i], expected[i]) << "where index = " << i; } } } // end test_util namespace // Need for hipcub::DeviceReduce::Min/Max etc. namespace std { template<> class numeric_limits> { using T = typename test_utils::custom_test_type; public: static constexpr inline T max() { return std::numeric_limits::max(); } static constexpr inline T lowest() { return std::numeric_limits::lowest(); } }; template<> class numeric_limits> { using T = typename test_utils::custom_test_type; public: static constexpr inline T max() { return std::numeric_limits::max(); } static constexpr inline T lowest() { return std::numeric_limits::lowest(); } }; } #endif // ROCPRIM_TEST_HIPCUB_TEST_UTILS_HPP_