@@ -72,15 +72,19 @@ class GPUTPCCompressionGatherKernels : public GPUKernelTemplate
// Element types of the buf64 / buf128 staging arrays declared in the GPUSharedMemory union below.
// NOTE(review): uint4 is presumably the 4 x 32-bit GPU vector type (128 bits) - confirm.
7272 using Vec64 = uint64_t ;
7373 using Vec128 = uint4;
7474
75- struct GPUSharedMemory : public GPUKernelTemplate ::GPUSharedMemoryScan64<uint32_t , GPUCA_GET_THREAD_COUNT(GPUCA_LB_COMPRESSION_GATHER)> {
// Compile-time guard: GPUCA_GET_THREAD_COUNT must give the same value for the buffered32,
// buffered64, buffered128 and multiBlock launch-bound configurations as for the unbuffered one.
// GPUSharedMemory below is sized only from the unbuffered configuration.
// NOTE(review): presumably all of these kernel variants share that one struct, so a
// differing thread count would mis-size its arrays - confirm.
75+ static_assert (GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered) == GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_buffered32));
76+ static_assert (GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered) == GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_buffered64));
77+ static_assert (GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered) == GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_buffered128));
78+ static_assert (GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered) == GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_multiBlock));
79+ struct GPUSharedMemory : public GPUKernelTemplate ::GPUSharedMemoryScan64<uint32_t , GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered)> {
7680 union {
77- uint32_t warpOffset[GPUCA_GET_WARP_COUNT (GPUCA_LB_COMPRESSION_GATHER )];
78- Vec32 buf32[GPUCA_GET_WARP_COUNT (GPUCA_LB_COMPRESSION_GATHER )][GPUCA_WARP_SIZE];
79- Vec64 buf64[GPUCA_GET_WARP_COUNT (GPUCA_LB_COMPRESSION_GATHER )][GPUCA_WARP_SIZE];
80- Vec128 buf128[GPUCA_GET_WARP_COUNT (GPUCA_LB_COMPRESSION_GATHER )][GPUCA_WARP_SIZE];
81+ uint32_t warpOffset[GPUCA_GET_WARP_COUNT (GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered )];
82+ Vec32 buf32[GPUCA_GET_WARP_COUNT (GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered )][GPUCA_WARP_SIZE];
83+ Vec64 buf64[GPUCA_GET_WARP_COUNT (GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered )][GPUCA_WARP_SIZE];
84+ Vec128 buf128[GPUCA_GET_WARP_COUNT (GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered )][GPUCA_WARP_SIZE];
8185 struct {
82- uint32_t sizes[GPUCA_GET_WARP_COUNT(GPUCA_LB_COMPRESSION_GATHER )][GPUCA_WARP_SIZE];
83- uint32_t srcOffsets[GPUCA_GET_WARP_COUNT(GPUCA_LB_COMPRESSION_GATHER )][GPUCA_WARP_SIZE];
86+ uint32_t sizes[GPUCA_GET_WARP_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered )][GPUCA_WARP_SIZE];
87+ uint32_t srcOffsets[GPUCA_GET_WARP_COUNT(GPUCA_LB_GPUTPCCompressionGatherKernels_unbuffered )][GPUCA_WARP_SIZE];
8488 } unbuffered;
8589 };
8690
0 commit comments