15#ifndef GPUCOMMONALGORITHMTHRUST_H
16#define GPUCOMMONALGORITHMTHRUST_H
18#ifndef GPUCA_GPUCODE_COMPILEKERNELS
19#pragma GCC diagnostic push
20#pragma GCC diagnostic ignored "-Wshadow"
21#include <thrust/sort.h>
22#include <thrust/execution_policy.h>
23#include <thrust/device_ptr.h>
24#pragma GCC diagnostic pop
32#include <hipcub/hipcub.hpp>
37#define GPUCA_THRUST_NAMESPACE thrust::cuda
38#define GPUCA_CUB_NAMESPACE cub
40#define GPUCA_THRUST_NAMESPACE thrust::hip
41#define GPUCA_CUB_NAMESPACE hipcub
84GPUdi()
void GPUCommonAlgorithm::sortDeviceDynamic(T* begin, T*
end)
86 thrust::device_ptr<T> thrustBegin(
begin);
87 thrust::device_ptr<T> thrustEnd(
end);
88 thrust::sort(GPUCA_THRUST_NAMESPACE::par, thrustBegin, thrustEnd);
91template <
class T,
class S>
92GPUdi()
void GPUCommonAlgorithm::sortDeviceDynamic(T* begin, T*
end,
const S& comp)
94 thrust::device_ptr<T> thrustBegin(
begin);
95 thrust::device_ptr<T> thrustEnd(
end);
96 thrust::sort(GPUCA_THRUST_NAMESPACE::par, thrustBegin, thrustEnd,
comp);
99#ifndef GPUCA_GPUCODE_COMPILEKERNELS
100template <
class T,
class S>
103 thrust::device_ptr<T> p(begin);
106 thrust::sort(GPUCA_THRUST_NAMESPACE::par(alloc).on(
rec->mInternals->Streams[
stream]), p, p + N, comp);
109 void* tempMem =
nullptr;
110 GPUChkErrS(GPUCA_CUB_NAMESPACE::DeviceMergeSort::SortKeys(tempMem, tempSize, begin, N, comp,
rec->mInternals->Streams[
stream]));
112 GPUChkErrS(GPUCA_CUB_NAMESPACE::DeviceMergeSort::SortKeys(tempMem, tempSize, begin, N, comp,
rec->mInternals->Streams[
stream]));
119#undef GPUCA_THRUST_NAMESPACE
120#undef GPUCA_CUB_NAMESPACE
ThrustVolatileAllocator getThrustVolatileDeviceAllocator()
void * AllocateVolatileDeviceMemory(size_t size)
typedef void(APIENTRYP PFNGLCULLFACEPROC)(GLenum mode)
GPUhi() void GPUCommonAlgorithm