|
27 | 27 | #define GPUCA_WARP_SIZE 64 |
28 | 28 | #define GPUCA_PAR_AMD_EUS_PER_CU 4 |
29 | 29 | #define GPUCA_THREAD_COUNT_DEFAULT 256 |
30 | | - #define GPUCA_LB_GPUTPCCreateTrackingData 256 |
31 | | - #define GPUCA_LB_GPUTPCStartHitsSorter 512, 1 |
32 | | - #define GPUCA_LB_GPUTPCStartHitsFinder 1024 |
33 | | - #define GPUCA_LB_GPUTPCTrackletConstructor 512, 2 |
34 | | - #define GPUCA_LB_GPUTPCTrackletSelector 192, 3 |
35 | | - #define GPUCA_LB_GPUTPCNeighboursFinder 1024, 1 |
36 | | - #define GPUCA_LB_GPUTPCNeighboursCleaner 896 |
37 | | - #define GPUCA_LB_GPUTPCExtrapolationTracking 256 |
| 30 | + #define GPUCA_LB_GPUTPCCreateTrackingData 256, 7 |
| 31 | + #define GPUCA_LB_GPUTPCStartHitsSorter 1024, 5 |
| 32 | + #define GPUCA_LB_GPUTPCStartHitsFinder 1024, 2 |
| 33 | + #define GPUCA_LB_GPUTPCTrackletConstructor 768, 8 |
| 34 | + #define GPUCA_LB_GPUTPCTrackletSelector 384, 5 |
| 35 | + #define GPUCA_LB_GPUTPCNeighboursFinder 192, 8 |
| 36 | + #define GPUCA_LB_GPUTPCNeighboursCleaner 128, 5 |
| 37 | + #define GPUCA_LB_GPUTPCExtrapolationTracking 256, 7 |
38 | 38 | #define GPUCA_LB_GPUTPCCFDecodeZS 64, 4 |
39 | 39 | #define GPUCA_LB_GPUTPCCFDecodeZSLink GPUCA_WARP_SIZE |
40 | | - #define GPUCA_LB_GPUTPCCFDecodeZSDenseLink GPUCA_WARP_SIZE |
41 | | - #define GPUCA_LB_GPUTPCCFGather 1024, 1 |
42 | | - #define GPUCA_LB_GPUTPCGMMergerTrackFit 128, 1 |
43 | | - #define GPUCA_LB_GPUTPCGMMergerFollowLoopers 64, 12 |
44 | | - #define GPUCA_LB_GPUTPCGMMergerSectorRefit 256 |
| 40 | + #define GPUCA_LB_GPUTPCCFDecodeZSDenseLink GPUCA_WARP_SIZE, 4 |
| 41 | + #define GPUCA_LB_GPUTPCCFGather 1024, 5 |
| 42 | + #define GPUCA_LB_GPUTPCGMMergerTrackFit 192, 2 |
| 43 | + #define GPUCA_LB_GPUTPCGMMergerFollowLoopers 256, 5 |
| 44 | + #define GPUCA_LB_GPUTPCGMMergerSectorRefit 64, 4 |
45 | 45 | #define GPUCA_LB_GPUTPCGMMergerUnpackResetIds 256 |
46 | 46 | #define GPUCA_LB_GPUTPCGMMergerUnpackGlobal 256 |
47 | 47 | #define GPUCA_LB_GPUTPCGMMergerResolve_step0 512 |
|
56 | 56 | #define GPUCA_LB_GPUTPCGMMergerMergeBorders_step2 512 |
57 | 57 | #define GPUCA_LB_GPUTPCGMMergerMergeCE 512 |
58 | 58 | #define GPUCA_LB_GPUTPCGMMergerLinkExtrapolatedTracks 256 |
59 | | - #define GPUCA_LB_GPUTPCGMMergerCollect 512 |
| 59 | + #define GPUCA_LB_GPUTPCGMMergerCollect 768, 1 |
60 | 60 | #define GPUCA_LB_GPUTPCGMMergerSortTracksPrepare 256 |
61 | 61 | #define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step0 256 |
62 | 62 | #define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step1 256 |
63 | 63 | #define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step2 256 |
64 | 64 | #define GPUCA_LB_GPUTPCGMMergerFinalize_0 256 |
65 | 65 | #define GPUCA_LB_GPUTPCGMMergerFinalize_1 256 |
66 | 66 | #define GPUCA_LB_GPUTPCGMMergerFinalize_2 256 |
67 | | - #define GPUCA_LB_GPUTPCCompressionKernels_step0attached 64, 2 |
| 67 | + #define GPUCA_LB_GPUTPCCompressionKernels_step0attached 128, 1 |
68 | 68 | #define GPUCA_LB_GPUTPCCompressionKernels_step1unattached 512, 2 |
69 | 69 | #define GPUCA_LB_GPUTPCDecompressionKernels_step0attached 128, 2 |
70 | 70 | #define GPUCA_LB_GPUTPCDecompressionKernels_step1unattached 64, 2 |
71 | | - #define GPUCA_LB_GPUTPCCFCheckPadBaseline 64 |
| 71 | + #define GPUCA_LB_GPUTPCCFCheckPadBaseline 64, 10 |
72 | 72 | #define GPUCA_LB_GPUTPCCFChargeMapFiller_fillIndexMap 512 |
73 | 73 | #define GPUCA_LB_GPUTPCCFChargeMapFiller_fillFromDigits 512 |
74 | 74 | #define GPUCA_LB_GPUTPCCFChargeMapFiller_findFragmentStart 512 |
75 | | - #define GPUCA_LB_GPUTPCCFPeakFinder 512 |
| 75 | + #define GPUCA_LB_GPUTPCCFPeakFinder 512, 9 |
76 | 76 | #define GPUCA_LB_GPUTPCCFNoiseSuppression 512 |
77 | | - #define GPUCA_LB_GPUTPCCFDeconvolution 512 |
78 | | - #define GPUCA_LB_GPUTPCCFClusterizer 448 |
| 77 | + #define GPUCA_LB_GPUTPCCFDeconvolution 512, 5 |
| 78 | + #define GPUCA_LB_GPUTPCCFClusterizer 448, 3 |
79 | 79 | #define GPUCA_LB_COMPRESSION_GATHER 1024 |
80 | | - #define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 5 |
81 | | - #define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 20 |
| 80 | + #define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 10 |
| 81 | + #define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_GLOBAL 4 |
| 82 | + #define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_SHARED 0 |
| 83 | + #define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 9 |
82 | 84 | #define GPUCA_PAR_ALTERNATE_BORDER_SORT 1 |
83 | 85 | #define GPUCA_PAR_SORT_BEFORE_FIT 1 |
84 | 86 | #define GPUCA_PAR_NO_ATOMIC_PRECHECK 1 |
|
90 | 92 | #define GPUCA_WARP_SIZE 64 |
91 | 93 | #define GPUCA_PAR_AMD_EUS_PER_CU 4 |
92 | 94 | #define GPUCA_THREAD_COUNT_DEFAULT 256 |
93 | | - #define GPUCA_LB_GPUTPCCreateTrackingData 128 |
94 | | - #define GPUCA_LB_GPUTPCStartHitsSorter 1024, 2 |
95 | | - #define GPUCA_LB_GPUTPCStartHitsFinder 1024 |
96 | | - #define GPUCA_LB_GPUTPCTrackletConstructor 256, 2 |
97 | | - #define GPUCA_LB_GPUTPCTrackletSelector 256, 8 |
98 | | - #define GPUCA_LB_GPUTPCNeighboursFinder 1024, 1 |
99 | | - #define GPUCA_LB_GPUTPCNeighboursCleaner 896 |
100 | | - #define GPUCA_LB_GPUTPCExtrapolationTracking 256 |
101 | | - #define GPUCA_LB_GPUTPCCFDecodeZS 64, 4 |
| 95 | + #define GPUCA_LB_GPUTPCCreateTrackingData 192, 2 |
| 96 | + #define GPUCA_LB_GPUTPCStartHitsSorter 512, 7 |
| 97 | + #define GPUCA_LB_GPUTPCStartHitsFinder 1024, 7 |
| 98 | + #define GPUCA_LB_GPUTPCTrackletConstructor 512, 10 |
| 99 | + #define GPUCA_LB_GPUTPCTrackletSelector 192, 10 |
| 100 | + #define GPUCA_LB_GPUTPCNeighboursFinder 960, 8 |
| 101 | + #define GPUCA_LB_GPUTPCNeighboursCleaner 384, 9 |
| 102 | + #define GPUCA_LB_GPUTPCExtrapolationTracking 256, 2 |
| 103 | + #define GPUCA_LB_GPUTPCCFDecodeZS 64, 1 |
102 | 104 | #define GPUCA_LB_GPUTPCCFDecodeZSLink GPUCA_WARP_SIZE |
103 | | - #define GPUCA_LB_GPUTPCCFDecodeZSDenseLink GPUCA_WARP_SIZE |
| 105 | + #define GPUCA_LB_GPUTPCCFDecodeZSDenseLink GPUCA_WARP_SIZE, 14 |
104 | 106 | #define GPUCA_LB_GPUTPCCFGather 1024, 1 |
105 | | - #define GPUCA_LB_GPUTPCGMMergerTrackFit 64, 1 |
106 | | - #define GPUCA_LB_GPUTPCGMMergerFollowLoopers 256, 4, 200 |
107 | | - #define GPUCA_LB_GPUTPCGMMergerSectorRefit 256 |
| 107 | + #define GPUCA_LB_GPUTPCGMMergerTrackFit 64, 7 |
| 108 | + #define GPUCA_LB_GPUTPCGMMergerFollowLoopers 256, 5 |
| 109 | + #define GPUCA_LB_GPUTPCGMMergerSectorRefit 256, 2 |
108 | 110 | #define GPUCA_LB_GPUTPCGMMergerUnpackResetIds 256 |
109 | 111 | #define GPUCA_LB_GPUTPCGMMergerUnpackGlobal 256 |
110 | 112 | #define GPUCA_LB_GPUTPCGMMergerResolve_step0 256 |
|
119 | 121 | #define GPUCA_LB_GPUTPCGMMergerMergeBorders_step2 256 |
120 | 122 | #define GPUCA_LB_GPUTPCGMMergerMergeCE 256 |
121 | 123 | #define GPUCA_LB_GPUTPCGMMergerLinkExtrapolatedTracks 256 |
122 | | - #define GPUCA_LB_GPUTPCGMMergerCollect 512 |
| 124 | + #define GPUCA_LB_GPUTPCGMMergerCollect 1024, 1 |
123 | 125 | #define GPUCA_LB_GPUTPCGMMergerSortTracksPrepare 256 |
124 | 126 | #define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step0 256 |
125 | 127 | #define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step1 256 |
126 | 128 | #define GPUCA_LB_GPUTPCGMMergerPrepareForFit_step2 256 |
127 | 129 | #define GPUCA_LB_GPUTPCGMMergerFinalize_0 256 |
128 | 130 | #define GPUCA_LB_GPUTPCGMMergerFinalize_1 256 |
129 | 131 | #define GPUCA_LB_GPUTPCGMMergerFinalize_2 256 |
130 | | - #define GPUCA_LB_GPUTPCCompressionKernels_step0attached 192, 2 |
| 132 | + #define GPUCA_LB_GPUTPCCompressionKernels_step0attached 64, 2 |
131 | 133 | #define GPUCA_LB_GPUTPCCompressionKernels_step1unattached 512, 2 |
132 | 134 | #define GPUCA_LB_GPUTPCDecompressionKernels_step0attached 128, 2 |
133 | 135 | #define GPUCA_LB_GPUTPCDecompressionKernels_step1unattached 64, 2 |
134 | | - #define GPUCA_LB_GPUTPCCFCheckPadBaseline 64 |
| 136 | + #define GPUCA_LB_GPUTPCCFCheckPadBaseline 64, 2 |
135 | 137 | #define GPUCA_LB_GPUTPCCFChargeMapFiller_fillIndexMap 512 |
136 | 138 | #define GPUCA_LB_GPUTPCCFChargeMapFiller_fillFromDigits 512 |
137 | 139 | #define GPUCA_LB_GPUTPCCFChargeMapFiller_findFragmentStart 512 |
138 | | - #define GPUCA_LB_GPUTPCCFPeakFinder 512 |
| 140 | + #define GPUCA_LB_GPUTPCCFPeakFinder 512, 4 |
139 | 141 | #define GPUCA_LB_GPUTPCCFNoiseSuppression 512 |
140 | | - #define GPUCA_LB_GPUTPCCFDeconvolution 512 |
141 | | - #define GPUCA_LB_GPUTPCCFClusterizer 512 |
| 142 | + #define GPUCA_LB_GPUTPCCFDeconvolution 512, 5 |
| 143 | + #define GPUCA_LB_GPUTPCCFClusterizer 512, 2 |
142 | 144 | #define GPUCA_LB_COMPRESSION_GATHER 1024 |
143 | | - #define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 5 |
144 | | - #define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 20 |
| 145 | + #define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 4 |
| 146 | + #define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_GLOBAL 2 |
| 147 | + #define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_SHARED 0 |
| 148 | + #define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 27 |
145 | 149 | #define GPUCA_PAR_ALTERNATE_BORDER_SORT 1 |
146 | 150 | #define GPUCA_PAR_SORT_BEFORE_FIT 1 |
147 | 151 | #define GPUCA_PAR_NO_ATOMIC_PRECHECK 1 |
|
0 commit comments