Skip to content

Commit 099c111

Browse files
cima22 authored and davidrohr committed
GPU TPC: update optimal AMD default parameters for PbPb data
1 parent 490589c commit 099c111

File tree

1 file changed

+46
-42
lines changed

1 file changed

+46
-42
lines changed

GPU/GPUTracking/Definitions/GPUDefParametersDefaults.h

Lines changed: 46 additions & 42 deletions
Original file line numberDiff line numberDiff line change
@@ -27,21 +27,21 @@
2727
#define GPUCA_WARP_SIZE 64
2828
#define GPUCA_PAR_AMD_EUS_PER_CU 4
2929
#define GPUCA_THREAD_COUNT_DEFAULT 256
30-
#define GPUCA_LB_GPUTPCCreateTrackingData 256
31-
#define GPUCA_LB_GPUTPCStartHitsSorter 512, 1
32-
#define GPUCA_LB_GPUTPCStartHitsFinder 1024
33-
#define GPUCA_LB_GPUTPCTrackletConstructor 512, 2
34-
#define GPUCA_LB_GPUTPCTrackletSelector 192, 3
35-
#define GPUCA_LB_GPUTPCNeighboursFinder 1024, 1
36-
#define GPUCA_LB_GPUTPCNeighboursCleaner 896
37-
#define GPUCA_LB_GPUTPCExtrapolationTracking 256
30+
#define GPUCA_LB_GPUTPCCreateTrackingData 256, 7
31+
#define GPUCA_LB_GPUTPCStartHitsSorter 1024, 5
32+
#define GPUCA_LB_GPUTPCStartHitsFinder 1024, 2
33+
#define GPUCA_LB_GPUTPCTrackletConstructor 768, 8
34+
#define GPUCA_LB_GPUTPCTrackletSelector 384, 5
35+
#define GPUCA_LB_GPUTPCNeighboursFinder 192, 8
36+
#define GPUCA_LB_GPUTPCNeighboursCleaner 128, 5
37+
#define GPUCA_LB_GPUTPCExtrapolationTracking 256, 7
3838
#define GPUCA_LB_GPUTPCCFDecodeZS 64, 4
3939
#define GPUCA_LB_GPUTPCCFDecodeZSLink GPUCA_WARP_SIZE
40-
#define GPUCA_LB_GPUTPCCFDecodeZSDenseLink GPUCA_WARP_SIZE
41-
#define GPUCA_LB_GPUTPCCFGather 1024, 1
42-
#define GPUCA_LB_GPUTPCGMMergerTrackFit 128, 1
43-
#define GPUCA_LB_GPUTPCGMMergerFollowLoopers 64, 12
44-
#define GPUCA_LB_GPUTPCGMMergerSectorRefit 256
40+
#define GPUCA_LB_GPUTPCCFDecodeZSDenseLink GPUCA_WARP_SIZE, 4
41+
#define GPUCA_LB_GPUTPCCFGather 1024, 5
42+
#define GPUCA_LB_GPUTPCGMMergerTrackFit 192, 2
43+
#define GPUCA_LB_GPUTPCGMMergerFollowLoopers 256, 5
44+
#define GPUCA_LB_GPUTPCGMMergerSectorRefit 64, 4
4545
#define GPUCA_LB_GPUTPCGMMergerUnpackResetIds 256
4646
#define GPUCA_LB_GPUTPCGMMergerUnpackGlobal 256
4747
#define GPUCA_LB_GPUTPCGMMergerResolve_step0 512
@@ -56,29 +56,31 @@
5656
#define GPUCA_LB_GPUTPCGMMergerMergeBorders_step2 512
5757
#define GPUCA_LB_GPUTPCGMMergerMergeCE 512
5858
#define GPUCA_LB_GPUTPCGMMergerLinkExtrapolatedTracks 256
59-
#define GPUCA_LB_GPUTPCGMMergerCollect 512
59+
#define GPUCA_LB_GPUTPCGMMergerCollect 768, 1
6060
#define GPUCA_LB_GPUTPCGMMergerSortTracksPrepare 256
6161
#define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step0 256
6262
#define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step1 256
6363
#define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step2 256
6464
#define GPUCA_LB_GPUTPCGMMergerFinalize_0 256
6565
#define GPUCA_LB_GPUTPCGMMergerFinalize_1 256
6666
#define GPUCA_LB_GPUTPCGMMergerFinalize_2 256
67-
#define GPUCA_LB_GPUTPCCompressionKernels_step0attached 64, 2
67+
#define GPUCA_LB_GPUTPCCompressionKernels_step0attached 128, 1
6868
#define GPUCA_LB_GPUTPCCompressionKernels_step1unattached 512, 2
6969
#define GPUCA_LB_GPUTPCDecompressionKernels_step0attached 128, 2
7070
#define GPUCA_LB_GPUTPCDecompressionKernels_step1unattached 64, 2
71-
#define GPUCA_LB_GPUTPCCFCheckPadBaseline 64
71+
#define GPUCA_LB_GPUTPCCFCheckPadBaseline 64, 10
7272
#define GPUCA_LB_GPUTPCCFChargeMapFiller_fillIndexMap 512
7373
#define GPUCA_LB_GPUTPCCFChargeMapFiller_fillFromDigits 512
7474
#define GPUCA_LB_GPUTPCCFChargeMapFiller_findFragmentStart 512
75-
#define GPUCA_LB_GPUTPCCFPeakFinder 512
75+
#define GPUCA_LB_GPUTPCCFPeakFinder 512, 9
7676
#define GPUCA_LB_GPUTPCCFNoiseSuppression 512
77-
#define GPUCA_LB_GPUTPCCFDeconvolution 512
78-
#define GPUCA_LB_GPUTPCCFClusterizer 448
77+
#define GPUCA_LB_GPUTPCCFDeconvolution 512, 5
78+
#define GPUCA_LB_GPUTPCCFClusterizer 448, 3
7979
#define GPUCA_LB_COMPRESSION_GATHER 1024
80-
#define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 5
81-
#define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 20
80+
#define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 10
81+
#define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_GLOBAL 4 // NOTE(review): presumably the neighbours-finder unroll factor for the global-memory path; name must carry the GPUCA_ prefix like the matching _UNROLL_SHARED parameter
82+
#define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_SHARED 0
83+
#define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 9
8284
#define GPUCA_PAR_ALTERNATE_BORDER_SORT 1
8385
#define GPUCA_PAR_SORT_BEFORE_FIT 1
8486
#define GPUCA_PAR_NO_ATOMIC_PRECHECK 1
@@ -90,21 +92,21 @@
9092
#define GPUCA_WARP_SIZE 64
9193
#define GPUCA_PAR_AMD_EUS_PER_CU 4
9294
#define GPUCA_THREAD_COUNT_DEFAULT 256
93-
#define GPUCA_LB_GPUTPCCreateTrackingData 128
94-
#define GPUCA_LB_GPUTPCStartHitsSorter 1024, 2
95-
#define GPUCA_LB_GPUTPCStartHitsFinder 1024
96-
#define GPUCA_LB_GPUTPCTrackletConstructor 256, 2
97-
#define GPUCA_LB_GPUTPCTrackletSelector 256, 8
98-
#define GPUCA_LB_GPUTPCNeighboursFinder 1024, 1
99-
#define GPUCA_LB_GPUTPCNeighboursCleaner 896
100-
#define GPUCA_LB_GPUTPCExtrapolationTracking 256
101-
#define GPUCA_LB_GPUTPCCFDecodeZS 64, 4
95+
#define GPUCA_LB_GPUTPCCreateTrackingData 192, 2
96+
#define GPUCA_LB_GPUTPCStartHitsSorter 512, 7
97+
#define GPUCA_LB_GPUTPCStartHitsFinder 1024, 7
98+
#define GPUCA_LB_GPUTPCTrackletConstructor 512, 10
99+
#define GPUCA_LB_GPUTPCTrackletSelector 192, 10
100+
#define GPUCA_LB_GPUTPCNeighboursFinder 960, 8
101+
#define GPUCA_LB_GPUTPCNeighboursCleaner 384, 9
102+
#define GPUCA_LB_GPUTPCExtrapolationTracking 256, 2
103+
#define GPUCA_LB_GPUTPCCFDecodeZS 64, 1
102104
#define GPUCA_LB_GPUTPCCFDecodeZSLink GPUCA_WARP_SIZE
103-
#define GPUCA_LB_GPUTPCCFDecodeZSDenseLink GPUCA_WARP_SIZE
105+
#define GPUCA_LB_GPUTPCCFDecodeZSDenseLink GPUCA_WARP_SIZE, 14
104106
#define GPUCA_LB_GPUTPCCFGather 1024, 1
105-
#define GPUCA_LB_GPUTPCGMMergerTrackFit 64, 1
106-
#define GPUCA_LB_GPUTPCGMMergerFollowLoopers 256, 4, 200
107-
#define GPUCA_LB_GPUTPCGMMergerSectorRefit 256
107+
#define GPUCA_LB_GPUTPCGMMergerTrackFit 64, 7
108+
#define GPUCA_LB_GPUTPCGMMergerFollowLoopers 256, 5
109+
#define GPUCA_LB_GPUTPCGMMergerSectorRefit 256, 2
108110
#define GPUCA_LB_GPUTPCGMMergerUnpackResetIds 256
109111
#define GPUCA_LB_GPUTPCGMMergerUnpackGlobal 256
110112
#define GPUCA_LB_GPUTPCGMMergerResolve_step0 256
@@ -119,29 +121,31 @@
119121
#define GPUCA_LB_GPUTPCGMMergerMergeBorders_step2 256
120122
#define GPUCA_LB_GPUTPCGMMergerMergeCE 256
121123
#define GPUCA_LB_GPUTPCGMMergerLinkExtrapolatedTracks 256
122-
#define GPUCA_LB_GPUTPCGMMergerCollect 512
124+
#define GPUCA_LB_GPUTPCGMMergerCollect 1024, 1
123125
#define GPUCA_LB_GPUTPCGMMergerSortTracksPrepare 256
124126
#define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step0 256
125127
#define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step1 256
126128
#define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step2 256
127129
#define GPUCA_LB_GPUTPCGMMergerFinalize_0 256
128130
#define GPUCA_LB_GPUTPCGMMergerFinalize_1 256
129131
#define GPUCA_LB_GPUTPCGMMergerFinalize_2 256
130-
#define GPUCA_LB_GPUTPCCompressionKernels_step0attached 192, 2
132+
#define GPUCA_LB_GPUTPCCompressionKernels_step0attached 64, 2
131133
#define GPUCA_LB_GPUTPCCompressionKernels_step1unattached 512, 2
132134
#define GPUCA_LB_GPUTPCDecompressionKernels_step0attached 128, 2
133135
#define GPUCA_LB_GPUTPCDecompressionKernels_step1unattached 64, 2
134-
#define GPUCA_LB_GPUTPCCFCheckPadBaseline 64
136+
#define GPUCA_LB_GPUTPCCFCheckPadBaseline 64, 2
135137
#define GPUCA_LB_GPUTPCCFChargeMapFiller_fillIndexMap 512
136138
#define GPUCA_LB_GPUTPCCFChargeMapFiller_fillFromDigits 512
137139
#define GPUCA_LB_GPUTPCCFChargeMapFiller_findFragmentStart 512
138-
#define GPUCA_LB_GPUTPCCFPeakFinder 512
140+
#define GPUCA_LB_GPUTPCCFPeakFinder 512, 4
139141
#define GPUCA_LB_GPUTPCCFNoiseSuppression 512
140-
#define GPUCA_LB_GPUTPCCFDeconvolution 512
141-
#define GPUCA_LB_GPUTPCCFClusterizer 512
142+
#define GPUCA_LB_GPUTPCCFDeconvolution 512, 5
143+
#define GPUCA_LB_GPUTPCCFClusterizer 512, 2
142144
#define GPUCA_LB_COMPRESSION_GATHER 1024
143-
#define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 5
144-
#define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 20
145+
#define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 4
146+
#define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_GLOBAL 2
147+
#define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_SHARED 0
148+
#define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 27
145149
#define GPUCA_PAR_ALTERNATE_BORDER_SORT 1
146150
#define GPUCA_PAR_SORT_BEFORE_FIT 1
147151
#define GPUCA_PAR_NO_ATOMIC_PRECHECK 1

0 commit comments

Comments
 (0)