Skip to content
Snippets Groups Projects
Commit 67c202e9 authored by yaskovet
Browse files

Move parallel primitives lib: moderngpu to CUB (define GPU_HOST_DEVICE)

parent 92e2df9a
No related branches found
No related tags found
No related merge requests found
Pipeline #5905 failed
......@@ -15,6 +15,7 @@
#include <type_traits>
#define CUDA_ON_BACKEND CUDA_BACKEND_ALPAKA
#define GPU_HOST_DEVICE
extern alpa_base_structs __alpa_base__;
......
......@@ -13,6 +13,10 @@ constexpr int default_kernel_wg_threads_ = 1024;
#ifdef __NVCC__
#include "operators.hpp"
// Fallback definition of GPU_HOST_DEVICE, used only when no definition is
// already in effect at this point. It expands to the CUDA qualifiers
// `__forceinline__ __device__ __host__`, so functions annotated with the
// macro are compiled for both host and device.
#ifndef GPU_HOST_DEVICE
#define GPU_HOST_DEVICE __forceinline__ __device__ __host__
#endif
template<typename lambda_f>
__global__ void kernel_launch_lambda(lambda_f f)
{
......
......@@ -11,6 +11,7 @@ constexpr int default_kernel_wg_threads_ = 1024;
#define CUDA_ON_BACKEND CUDA_BACKEND_OPENMP
#define GPU_HOST_DEVICE
#include "util/cudify/cudify_hardware_cpu.hpp"
......
......@@ -2,6 +2,7 @@
#define CUDIFY_SEQUENCIAL_HPP_
#define CUDA_ON_BACKEND CUDA_BACKEND_SEQUENTIAL
#define GPU_HOST_DEVICE
#include "config.h"
......@@ -103,6 +104,7 @@ static T atomicAdd(T * address, T2 val)
return old;
};
namespace gpu
{
template<typename type_t>
......
0% Loading. Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment