/* ************************************************************************
 * Copyright 2016-2021 Advanced Micro Devices, Inc.
 *
 * ************************************************************************ */

#include "testing_trsm_batched_ex.hpp"
#include "testing_trsm_ex.hpp"
#include "testing_trsm_strided_batched_ex.hpp"
#include "utility.h"
// NOTE(review): the system header names were missing from the reviewed text. <tuple> and
// <vector> are required by the declarations below; <math.h> and <stdexcept> are a best guess
// -- confirm against the build.
#include <math.h>
#include <stdexcept>
#include <tuple>
#include <vector>

using ::testing::Combine;
using ::testing::TestWithParam;
using ::testing::Values;
using ::testing::ValuesIn;
using namespace std;

// only GCC/VS 2010 comes with std::tr1::tuple, but it is unnecessary, std::tuple is good enough;
//
// One test parameter set, in order:
//   {M, N, lda, ldb}, {alpha, alphai}, {side, uplo, transA, diag},
//   stride_scale, batch_count, fortran
typedef std::tuple<vector<int>, vector<double>, vector<char>, double, int, bool> trsm_ex_tuple;

/* =====================================================================
README: This file contains testers to verify the correctness of
        BLAS routines with google test

        It is supposed to be played/used by advanced / expert users
        Normal users only need to get the library routines without testers
     =================================================================== */

/* =====================================================================
Advanced users only: brainstorm the parameters, but do not make an artificial one
which invalidates the matrix, e.g. lda pairs with M, and "lda must be >= M".
The case "lda < M" will be guarded by the argument-checkers inside the API, of course.
Yet, the goal of this file is to verify result correctness, not the argument-checkers.

Representative sampling is sufficient, endless brute-force sampling is not necessary
=================================================================== */

// vector of vector, each vector is a {M, N, lda, ldb};
// add/delete as a group
const vector<vector<int>> full_matrix_size_range = {
    {192, 192, 192, 192},
    {640, 640, 960, 960},
    // {1000, 1000, 1000, 1000},
    // {2000, 2000, 2000, 2000},
};

// each vector is an {alpha, alphai} pair
const vector<vector<double>> alpha_range = {{1.0, -5.0}};

// vector of vector, each vector is a {side, uplo, transA, diag};
// side has two options "Left (L), Right (R)"
// uplo has two "Lower (L), Upper (U)"
// transA has three ("Nontranspose (N), conjTranspose(C), transpose (T)")
// for single/double precision, 'C' (conjTranspose) will be downgraded to 'T' (transpose)
// automatically in strsm/dtrsm,
// so we use 'C'
// Diag has two options ("Non-unit (N), Unit (U)")

// Each letter is capitalized, e.g. do not use 'l', but use 'L' instead.
const vector<vector<char>> side_uplo_transA_diag_range = {
    {'L', 'L', 'N', 'N'},
    {'R', 'L', 'N', 'N'},
    {'L', 'U', 'C', 'N'},
};

const vector<double> stride_scale_range = {2.5};

// includes a negative and a zero batch count on purpose, next to the regular ones
const vector<int> batch_count_range = {-1, 0, 1, 2};

const bool is_fortran[] = {false, true};

/* ===============Google Unit Test==================================================== */

/* =====================================================================
     BLAS-3 trsm:
=================================================================== */

/* ============================Setup Arguments======================================= */

// Please use "class Arguments" (see utility.hpp) to pass parameters to templated testers;
// Some routines may not touch/use certain "members" of objects "argus".
// like BLAS-1 Scal does not have lda, BLAS-2 GEMV does not have ldb, ldc;
// That is fine. These testers & routines will leave untouched members alone.
// Do not use std::tuple to directly pass parameters to testers // by std:tuple, you have unpack it with extreme care for each one by like "std::get<0>" which is // not intuitive and error-prone Arguments setup_trsm_ex_arguments(trsm_ex_tuple tup) { vector matrix_size = std::get<0>(tup); vector alpha_alphai = std::get<1>(tup); vector side_uplo_transA_diag = std::get<2>(tup); double stride_scale = std::get<3>(tup); int batch_count = std::get<4>(tup); bool fortran = std::get<5>(tup); Arguments arg; // see the comments about matrix_size_range above arg.M = matrix_size[0]; arg.N = matrix_size[1]; arg.lda = matrix_size[2]; arg.ldb = matrix_size[3]; arg.alpha = alpha_alphai[0]; arg.alphai = alpha_alphai[1]; arg.side_option = side_uplo_transA_diag[0]; arg.uplo_option = side_uplo_transA_diag[1]; arg.transA_option = side_uplo_transA_diag[2]; arg.diag_option = side_uplo_transA_diag[3]; arg.timing = 0; arg.stride_scale = stride_scale; arg.batch_count = batch_count; arg.fortran = fortran; return arg; } class trsm_ex_gtest : public ::TestWithParam { protected: trsm_ex_gtest() {} virtual ~trsm_ex_gtest() {} virtual void SetUp() {} virtual void TearDown() {} }; #ifndef __HIP_PLATFORM_NVCC__ TEST_P(trsm_ex_gtest, trsm_ex_gtest_float) { // GetParam return a tuple. Tee setup routine unpack the tuple // and initializes arg(Arguments) which will be passed to testing routine // The Arguments data struture have physical meaning associated. // while the tuple is non-intuitive. Arguments arg = setup_trsm_ex_arguments(GetParam()); arg.compute_type = HIPBLAS_R_32F; hipblasStatus_t status = testing_trsm_ex(arg); // if not success, then the input argument is problematic, so detect the error message if(status != HIPBLAS_STATUS_SUCCESS) { if(arg.M < 0 || arg.N < 0) { EXPECT_EQ(HIPBLAS_STATUS_INVALID_VALUE, status); } else if(arg.side_option == 'L' ? 
arg.lda < arg.M : arg.lda < arg.N) { EXPECT_EQ(HIPBLAS_STATUS_INVALID_VALUE, status); } else if(arg.ldb < arg.M) { EXPECT_EQ(HIPBLAS_STATUS_INVALID_VALUE, status); } else { EXPECT_EQ(HIPBLAS_STATUS_SUCCESS, status); // fail } } } TEST_P(trsm_ex_gtest, trsm_gtest_ex_double_complex) { // GetParam return a tuple. Tee setup routine unpack the tuple // and initializes arg(Arguments) which will be passed to testing routine // The Arguments data struture have physical meaning associated. // while the tuple is non-intuitive. Arguments arg = setup_trsm_ex_arguments(GetParam()); arg.compute_type = HIPBLAS_C_64F; hipblasStatus_t status = testing_trsm_ex(arg); // if not success, then the input argument is problematic, so detect the error message if(status != HIPBLAS_STATUS_SUCCESS) { if(arg.M < 0 || arg.N < 0 || arg.ldb < arg.M || (arg.side_option == 'L' ? arg.lda < arg.M : arg.lda < arg.N)) { EXPECT_EQ(HIPBLAS_STATUS_INVALID_VALUE, status); } else { EXPECT_EQ(HIPBLAS_STATUS_SUCCESS, status); // fail } } } TEST_P(trsm_ex_gtest, trsm_batched_ex_gtest_float) { // GetParam return a tuple. Tee setup routine unpack the tuple // and initializes arg(Arguments) which will be passed to testing routine // The Arguments data struture have physical meaning associated. // while the tuple is non-intuitive. Arguments arg = setup_trsm_ex_arguments(GetParam()); arg.compute_type = HIPBLAS_R_32F; hipblasStatus_t status = testing_trsm_batched_ex(arg); // if not success, then the input argument is problematic, so detect the error message if(status != HIPBLAS_STATUS_SUCCESS) { if(arg.M < 0 || arg.N < 0 || arg.lda < arg.K || arg.ldb < arg.M || (arg.side_option == 'L' ? arg.lda < arg.M : arg.lda < arg.N) || arg.batch_count < 0) { EXPECT_EQ(HIPBLAS_STATUS_INVALID_VALUE, status); } else { EXPECT_EQ(HIPBLAS_STATUS_SUCCESS, status); // fail } } } TEST_P(trsm_ex_gtest, trsm_batched_ex_gtest_double_complex) { // GetParam return a tuple. 
Tee setup routine unpack the tuple // and initializes arg(Arguments) which will be passed to testing routine // The Arguments data struture have physical meaning associated. // while the tuple is non-intuitive. Arguments arg = setup_trsm_ex_arguments(GetParam()); arg.compute_type = HIPBLAS_C_64F; hipblasStatus_t status = testing_trsm_batched_ex(arg); // if not success, then the input argument is problematic, so detect the error message if(status != HIPBLAS_STATUS_SUCCESS) { if(arg.M < 0 || arg.N < 0 || arg.lda < arg.K || arg.ldb < arg.M || (arg.side_option == 'L' ? arg.lda < arg.M : arg.lda < arg.N) || arg.batch_count < 0) { EXPECT_EQ(HIPBLAS_STATUS_INVALID_VALUE, status); } else { EXPECT_EQ(HIPBLAS_STATUS_SUCCESS, status); // fail } } } TEST_P(trsm_ex_gtest, trsm_strided_batched_ex_gtest_float) { // GetParam return a tuple. Tee setup routine unpack the tuple // and initializes arg(Arguments) which will be passed to testing routine // The Arguments data struture have physical meaning associated. // while the tuple is non-intuitive. Arguments arg = setup_trsm_ex_arguments(GetParam()); arg.compute_type = HIPBLAS_R_32F; hipblasStatus_t status = testing_trsm_strided_batched_ex(arg); // if not success, then the input argument is problematic, so detect the error message if(status != HIPBLAS_STATUS_SUCCESS) { if(arg.M < 0 || arg.N < 0 || arg.ldb < arg.M || (arg.side_option == 'L' ? arg.lda < arg.M : arg.lda < arg.N) || arg.batch_count < 0) { EXPECT_EQ(HIPBLAS_STATUS_INVALID_VALUE, status); } else { EXPECT_EQ(HIPBLAS_STATUS_SUCCESS, status); // fail } } } TEST_P(trsm_ex_gtest, trsm_strided_batched_ex_gtest_double_complex) { // GetParam return a tuple. Tee setup routine unpack the tuple // and initializes arg(Arguments) which will be passed to testing routine // The Arguments data struture have physical meaning associated. // while the tuple is non-intuitive. 
Arguments arg = setup_trsm_ex_arguments(GetParam()); arg.compute_type = HIPBLAS_C_64F; hipblasStatus_t status = testing_trsm_strided_batched_ex(arg); // if not success, then the input argument is problematic, so detect the error message if(status != HIPBLAS_STATUS_SUCCESS) { if(arg.M < 0 || arg.N < 0 || arg.ldb < arg.M || (arg.side_option == 'L' ? arg.lda < arg.M : arg.lda < arg.N) || arg.batch_count < 0) { EXPECT_EQ(HIPBLAS_STATUS_INVALID_VALUE, status); } else { EXPECT_EQ(HIPBLAS_STATUS_SUCCESS, status); // fail } } } // notice we are using vector of vector // so each elment in xxx_range is a avector, // ValuesIn take each element (a vector) and combine them and feed them to test_p // The combinations are { {M, N, lda, ldb}, alpha, {side, uplo, transA, diag} } // THis function mainly test the scope of matrix_size. the scope of side_uplo_transA_diag_range is // small // Testing order: side_uplo_transA_xx first, alpha_range second, full_matrix_size last // i.e fix the matrix size and alpha, test all the side_uplo_transA_xx first. INSTANTIATE_TEST_SUITE_P(hipblasTrsm_matrix_size, trsm_ex_gtest, Combine(ValuesIn(full_matrix_size_range), ValuesIn(alpha_range), ValuesIn(side_uplo_transA_diag_range), ValuesIn(stride_scale_range), ValuesIn(batch_count_range), ValuesIn(is_fortran))); #endif