Skip to content

Commit 222fa1b

Browse files
committed
GPU: Add comments for customizable kernel parameters
1 parent 5d625cc commit 222fa1b

File tree

1 file changed

+13
-13
lines changed

1 file changed

+13
-13
lines changed

GPU/GPUTracking/kernels.cmake

Lines changed: 13 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -135,17 +135,17 @@ o2_gpu_add_kernel("GPUTPCNNClusterizerKernels, publishClass2Regression" "= TPC
135135
o2_gpu_add_kernel("GPUTPCNNClusterizerKernels, publishDeconvolutionFlags" "= TPCNNCLUSTERFINDER" LB uint8_t sector int8_t dtype int8_t withMC uint32_t batchStart)
136136
endif()
137137

138-
o2_gpu_kernel_add_parameter(NEIGHBOURS_FINDER_MAX_NNEIGHUP
139-
NEIGHBOURS_FINDER_UNROLL_GLOBAL
140-
NEIGHBOURS_FINDER_UNROLL_SHARED
141-
TRACKLET_SELECTOR_HITS_REG_SIZE
142-
ALTERNATE_BORDER_SORT
143-
SORT_BEFORE_FIT
144-
NO_ATOMIC_PRECHECK
145-
COMP_GATHER_KERNEL
146-
COMP_GATHER_MODE
147-
SORT_STARTHITS
148-
CF_SCAN_WORKGROUP_SIZE)
138+
o2_gpu_kernel_add_parameter(NEIGHBOURS_FINDER_MAX_NNEIGHUP # Number of neighbours finder hits to cache in shared memory
139+
NEIGHBOURS_FINDER_UNROLL_GLOBAL # Unroll factor for neighbours finder iterating hits in local memory
140+
NEIGHBOURS_FINDER_UNROLL_SHARED # Fully unroll iteration over neighbours finder hits in shared memory [0/1]
141+
TRACKLET_SELECTOR_HITS_REG_SIZE # Number of hits to cache in shared memory in tracklet selector
142+
ALTERNATE_BORDER_SORT # Use alternative border sort approach [0/1]
143+
SORT_BEFORE_FIT # Sort tracks by length to reduce warp serialization [0/1]
144+
NO_ATOMIC_PRECHECK # Skip atomic precheck to reduce posterior synchronization [0/1]
145+
COMP_GATHER_KERNEL # Default kernel to use for Compression Gather Operation [0 - 4]
146+
COMP_GATHER_MODE # TPC Compression Gather Mode [0 - 3]
147+
SORT_STARTHITS # Sort start hits to improve cache locality during tracklet construction [0/1]
148+
CF_SCAN_WORKGROUP_SIZE) # Work group size to use in clusterizer scan operation
149149

150-
o2_gpu_kernel_add_string_parameter(DEDX_STORAGE_TYPE
151-
MERGER_INTERPOLATION_ERROR_TYPE)
150+
o2_gpu_kernel_add_string_parameter(DEDX_STORAGE_TYPE # Data type to use for intermediate storage of dEdx truncated mean inputs
151+
MERGER_INTERPOLATION_ERROR_TYPE) # Data type for storing intermediate track residuals for interpolation

0 commit comments

Comments
 (0)