/* ************************************************************************ * Copyright 2016 Advanced Micro Devices, Inc. * * ************************************************************************ */ #include #include #include #include "cblas_interface.h" #include "hipblas.hpp" #include "near.h" #include "norm.h" #include "utility.h" #include using namespace std; /* ============================================================================================ */ template hipblasStatus_t testing_rotg_strided_batched(Arguments arg) { double stride_scale = arg.stride_scale; int stride_a = stride_scale; int stride_b = stride_scale; int stride_c = stride_scale; int stride_s = stride_scale; int batch_count = arg.batch_count; hipblasStatus_t status_1 = HIPBLAS_STATUS_SUCCESS; hipblasStatus_t status_2 = HIPBLAS_STATUS_SUCCESS; hipblasStatus_t status_3 = HIPBLAS_STATUS_SUCCESS; hipblasStatus_t status_4 = HIPBLAS_STATUS_SUCCESS; hipblasHandle_t handle; hipblasCreate(&handle); const U rel_error = std::numeric_limits::epsilon() * 1000; // check to prevent undefined memory allocation error if(batch_count == 0) { hipblasDestroy(handle); return HIPBLAS_STATUS_SUCCESS; } else if(batch_count < 0) { hipblasDestroy(handle); return HIPBLAS_STATUS_INVALID_VALUE; } size_t size_a = size_t(stride_a) * size_t(batch_count); size_t size_b = size_t(stride_b) * size_t(batch_count); size_t size_c = size_t(stride_c) * size_t(batch_count); size_t size_s = size_t(stride_s) * size_t(batch_count); host_vector ha(size_a); host_vector hb(size_b); host_vector hc(size_c); host_vector hs(size_s); // Initial data on CPU srand(1); hipblas_init(ha, 1, 1, 1, stride_a, batch_count); hipblas_init(hb, 1, 1, 1, stride_b, batch_count); hipblas_init(hc, 1, 1, 1, stride_c, batch_count); hipblas_init(hs, 1, 1, 1, stride_s, batch_count); // CPU_BLAS host_vector ca = ha; host_vector cb = hb; host_vector cc = hc; host_vector cs = hs; for(int b = 0; b < batch_count; b++) { cblas_rotg(ca.data() + b * stride_a, cb.data() + b * stride_b, cc.data() + b * stride_c, cs.data() + b * stride_s); } // Test host { host_vector ra = ha; host_vector rb = hb; host_vector rc = hc; host_vector rs = hs; status_1 = hipblasSetPointerMode(handle, HIPBLAS_POINTER_MODE_HOST); status_2 = ((hipblasRotgStridedBatched( handle, ra, stride_a, rb, stride_b, rc, stride_c, rs, stride_s, batch_count))); if((status_1 != HIPBLAS_STATUS_SUCCESS) || (status_2 != HIPBLAS_STATUS_SUCCESS)) { hipblasDestroy(handle); if(status_1 != HIPBLAS_STATUS_SUCCESS) return status_1; if(status_2 != HIPBLAS_STATUS_SUCCESS) return status_2; } if(arg.unit_check) { near_check_general(1, 1, batch_count, 1, stride_a, ca, ra, rel_error); near_check_general(1, 1, batch_count, 1, stride_b, cb, rb, rel_error); near_check_general(1, 1, batch_count, 1, stride_c, cc, rc, rel_error); near_check_general(1, 1, batch_count, 1, stride_s, cs, rs, rel_error); } } // Test device { device_vector da(size_a); device_vector db(size_b); device_vector dc(size_c); device_vector ds(size_s); CHECK_HIP_ERROR(hipMemcpy(da, ha, sizeof(T) * size_a, hipMemcpyHostToDevice)); CHECK_HIP_ERROR(hipMemcpy(db, hb, sizeof(T) * size_b, hipMemcpyHostToDevice)); CHECK_HIP_ERROR(hipMemcpy(dc, hc, sizeof(U) * size_c, hipMemcpyHostToDevice)); CHECK_HIP_ERROR(hipMemcpy(ds, hs, sizeof(T) * size_s, hipMemcpyHostToDevice)); status_3 = hipblasSetPointerMode(handle, HIPBLAS_POINTER_MODE_DEVICE); status_4 = ((hipblasRotgStridedBatched( handle, da, stride_a, db, stride_b, dc, stride_c, ds, stride_s, batch_count))); if((status_3 != HIPBLAS_STATUS_SUCCESS) || (status_4 != HIPBLAS_STATUS_SUCCESS)) { hipblasDestroy(handle); if(status_3 != HIPBLAS_STATUS_SUCCESS) return status_3; if(status_4 != HIPBLAS_STATUS_SUCCESS) return status_4; } host_vector ra(size_a); host_vector rb(size_b); host_vector rc(size_c); host_vector rs(size_s); CHECK_HIP_ERROR(hipMemcpy(ra, da, sizeof(T) * size_a, hipMemcpyDeviceToHost)); CHECK_HIP_ERROR(hipMemcpy(rb, db, sizeof(T) * size_b, hipMemcpyDeviceToHost)); CHECK_HIP_ERROR(hipMemcpy(rc, dc, sizeof(U) * size_c, hipMemcpyDeviceToHost)); CHECK_HIP_ERROR(hipMemcpy(rs, ds, sizeof(T) * size_s, hipMemcpyDeviceToHost)); if(arg.unit_check) { near_check_general(1, 1, batch_count, 1, stride_a, ca, ra, rel_error); near_check_general(1, 1, batch_count, 1, stride_b, cb, rb, rel_error); near_check_general(1, 1, batch_count, 1, stride_c, cc, rc, rel_error); near_check_general(1, 1, batch_count, 1, stride_s, cs, rs, rel_error); } } hipblasDestroy(handle); return HIPBLAS_STATUS_SUCCESS; }