scan.hpp, reduce.hpp; tf::detail::cudaScanResult, tf::detail::cudaScanResult< T, vt, true >, tf::detail::cudaBlockScan, tf::detail::cudaBlockScan::storage_t; tf, tf::detail. CUDA scan algorithm include file.