91 template <typename Scalar, typename BaseVector>
94 Size =
sizeof(BaseVector) /
sizeof(Scalar),
100 template <
int32_t iKernel = defaultKernel>
103 template <typename T, typename
S>
106 template <typename T>
109 template <typename Scalar, typename Vector>
112 template <typename T>
// Declaration only: the definition of compressorMemcpyBuffered is not part of
// this view, so everything below about behavior is an assumption to confirm
// against the implementation.
//
// Template parameters:
//   V - element type of the staging buffer `buf`.
//   T - element type of the `dst` / `src` arrays.
//   S - element type of the `nums` array.
//
// Parameters (as declared):
//   buf           - mutable V* buffer (presumably per-warp scratch space - TODO confirm).
//   dst, src      - destination and read-only source arrays of T.
//   nums          - read-only per-entry counts (presumably the number of T elements
//                   belonging to each entry - TODO confirm).
//   srcOffets     - read-only per-entry uint32_t offsets. NOTE(review): the name
//                   looks like a typo for "srcOffsets"; left untouched here.
//   nEntries      - number of entries described by `nums` / `srcOffets`.
//   nLanes, iLane - lane count and index of the calling lane.
//   diff          - defaults to 0; meaning not visible here - TODO confirm.
//   scaleBase1024 - defaults to 1024 (name suggests a fixed-point scale factor
//                   where 1024 means 1.0 - verify against the definition).
//
// GPUdi() is a project macro defined elsewhere (presumably a device/inline
// function qualifier). The function is static and returns nothing.
115 template <typename V, typename T, typename
S>
116 GPUdi() static
void compressorMemcpyBuffered(V*
buf, T*
dst, const T*
src, const
S* nums, const uint32_t* srcOffets, uint32_t nEntries, int32_t nLanes, int32_t iLane, int32_t diff = 0,
size_t scaleBase1024 = 1024);
// Declaration only: the definition of calculateWarpOffsets is not part of this
// view, so the semantics noted below are assumptions to confirm against the
// implementation.
//
// Template parameter:
//   T - element type of the `nums` array.
//
// Parameters (as declared):
//   smem          - reference to the GPUSharedMemory object (project type declared
//                   elsewhere), passed by non-const reference.
//   nums          - mutable array of T (presumably per-entry counts - TODO confirm).
//   start, end    - uint32_t bounds into `nums` (presumably a half-open range
//                   [start, end) - TODO confirm).
//   nWarps, iWarp - warp count and index of the calling warp.
//   nLanes, iLane - lane count and index of the calling lane.
//
// Returns a uint32_t (presumably the offset assigned to the calling warp - verify
// against the definition). GPUdi() is a project macro defined elsewhere.
118 template <typename T>
119 GPUdi() static uint32_t calculateWarpOffsets(
GPUSharedMemory& smem, T* nums, uint32_t
start, uint32_t
end, int32_t nWarps, int32_t iWarp, int32_t nLanes, int32_t iLane);
121 template <typename V>