// RUN: %hc %s -o %t.out && %t.out #include #include // added for checking HSA profile #include // test C++AMP with fine-grained SVM // requires HSA Full Profile to operate successfully #define SIZE (16) using namespace hc; // test supply a template class with operator() to parallel_for_each template class prog { _Tp (&input)[N]; public: prog(_Tp (&t)[N]) [[cpu, hc]] : input(t) { } void operator() (hc::index<1>& idx) [[hc]] { input[idx[0]] = idx[0]; } void run() { parallel_for_each(extent<1>(N), *this); } // verify output bool test() { bool ret = true; for (int i = 0; i < N; ++i) { if (input[i] != i) { ret = false; break; } } return true; } }; int main() { bool ret = true; // only conduct the test in case we are running on a HSA full profile stack hc::accelerator acc; if (acc.is_hsa_accelerator() && acc.get_profile() == hc::hcAgentProfileFull) { // prepare test data int input_int[SIZE] { 0 }; unsigned input_unsigned[SIZE] { 0 }; float input_float[SIZE] { 0 }; double input_double[SIZE] { 0 }; // launch kernel prog p1(input_int); p1.run(); prog p2(input_unsigned); p2.run(); prog p3(input_float); p3.run(); prog p4(input_double); p4.run(); // check result ret &= p1.test(); ret &= p2.test(); ret &= p3.test(); ret &= p4.test(); } return !(ret == true); }