// NOTE(review): this file appears to be damaged and is not compilable as-is.
//   * The entire translation unit sits on one physical line, so everything
//     after the first `//` below is treated as a comment by the compiler.
//   * The four `#include` directives carry no header names, `template` has no
//     parameter list, and `tf::cuda_malloc_shared(...)`, `std::vector(...)`
//     and `cuda_find_if()` carry no template arguments -- presumably every
//     angle-bracketed span was stripped; TODO restore from the upstream copy.
//   * The text jumps from `for(int i=0; i` directly to `(); }`, so the rest of
//     the initialization loop and whatever followed it inside the task lambda
//     is missing from this copy.
//
// What the surviving text shows:
//   * cuda_find_if() creates a tf::Taskflow and a tf::Executor, then iterates
//     n from 0 up to 1234567 (step +1 while n <= 100, afterwards n = n*2 + 1).
//   * For each n it emplaces a task lambda (capturing n by value) that creates
//     a tf::cudaStream and a tf::cudaDefaultExecutionPolicy bound to it,
//     obtains `gdata` (n elements) and `gfind` (1 element) from
//     tf::cuda_malloc_shared, and builds a host-side std::vector `hdata` of
//     size n before starting to initialize the data.
//   * A doctest TEST_CASE named "cuda_find_if.float" with a 300-second timeout
//     decorator calls cuda_find_if().
#define DOCTEST_CONFIG_IMPLEMENT_WITH_MAIN #include #include #include #include // ---------------------------------------------------------------------------- // cuda_find_if // ---------------------------------------------------------------------------- template void cuda_find_if() { tf::Taskflow taskflow; tf::Executor executor; for(int n=0; n<=1234567; n = (n<=100) ? n+1 : n*2 + 1) { taskflow.emplace([n](){ tf::cudaStream stream; tf::cudaDefaultExecutionPolicy policy(stream); // gpu data auto gdata = tf::cuda_malloc_shared(n); auto gfind = tf::cuda_malloc_shared(1); // cpu data auto hdata = std::vector(n); // initialize the data for(int i=0; i(); } TEST_CASE("cuda_find_if.float" * doctest::timeout(300)) { cuda_find_if(); }