Skip to content

Commit eebb9e5

Browse files
committed
GPU TPC: Remove the option to retry the refit if cluster rejection breaks the track; the track will be rebuilt anyway in the future
1 parent bfcff02 commit eebb9e5

File tree

7 files changed

+17
-53
lines changed

7 files changed

+17
-53
lines changed

GPU/GPUTracking/Definitions/GPUSettingsList.h

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -155,7 +155,6 @@ AddOptionRTC(mergerInterpolateErrors, uint8_t, 1, "", 0, "Use interpolation inst
155155
AddOptionRTC(mergerInterpolateRejectAlsoOnCurrentPosition, uint8_t, 1, "", 0, "When using mergerInterpolateErrors, reject based on chi2 twice computed with interpolated and current track position starting from NDF > mergerNonInterpolateRejectMinNDF")
156156
AddOptionRTC(mergerNonInterpolateRejectMinNDF, uint8_t, 5, "", 0, "Minimum NDF of track for non-interpolated reject (both for chi2 and absolute distance)")
157157
AddOptionRTC(mergeCE, uint8_t, 1, "", 0, "Merge tracks accross the central electrode")
158-
AddOptionRTC(retryRefit, int8_t, 1, "", 0, "Retry refit with seeding errors and without cluster rejection when fit fails (=2 means retry in same kernel, =1 for separate kernel")
159158
AddOptionRTC(enablePID, int8_t, 1, "", 0, "Enable PID response")
160159
AddOptionRTC(PID_useNsigma, int8_t, 1, "", 0, "Use nSigma instead of absolute distance in PID response")
161160
AddOptionRTC(adddEdxSubThresholdClusters, int8_t, 1, "", 0, "Add sub threshold clusters in TPC dEdx computation")

GPU/GPUTracking/Global/GPUChainTrackingMerger.cxx

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -227,9 +227,6 @@ int32_t GPUChainTracking::RunTPCTrackingMerger(bool synchronizeOutput)
227227
}
228228

229229
runKernel<GPUTPCGMMergerTrackFit>(doGPU ? GetGrid(Merger.NMergedTracks(), 0) : GetGridAuto(0), mergerSortTracks ? 1 : 0);
230-
if (param().rec.tpc.retryRefit == 1) {
231-
runKernel<GPUTPCGMMergerTrackFit>(GetGridAuto(0), -1);
232-
}
233230
runKernel<GPUTPCGMMergerFollowLoopers>(GetGridAuto(0));
234231

235232
DoDebugAndDump(RecoStep::TPCMerging, GPUChainTrackingDebugFlags::TPCMergingRefit, Merger, &GPUTPCGMMerger::DumpRefit, *mDebugFile);

GPU/GPUTracking/Merger/GPUTPCGMMerger.cxx

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -402,8 +402,7 @@ void* GPUTPCGMMerger::SetPointersMerger(void* mem)
402402
computePointerWithAlignment(mem, mSharedCount, mNMaxClusters);
403403
memMax = (void*)std::max((size_t)mem, (size_t)memMax);
404404
mem = memBase;
405-
computePointerWithAlignment(mem, mLoopData, mNMaxTracks); // GPUTPCGMMergerTrackFit - GPUTPCGMMergerFollowLoopers
406-
computePointerWithAlignment(mem, mRetryRefitIds, mNMaxTracks); // Reducing mNMaxTracks for mLoopData / mRetryRefitIds does not save memory, since the other parts are larger anyway
405+
computePointerWithAlignment(mem, mLoopData, mNMaxTracks); // GPUTPCGMMergerTrackFit - GPUTPCGMMergerFollowLoopers, Reducing mNMaxTracks for mLoopData does not save memory, other parts are larger anyway
407406
memMax = (void*)std::max((size_t)mem, (size_t)memMax);
408407
mem = memBase;
409408
computePointerWithAlignment(mem, mLooperCandidates, mNMaxLooperMatches); // MergeLoopers 1-3

GPU/GPUTracking/Merger/GPUTPCGMMerger.h

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -66,7 +66,6 @@ class GPUTPCGMMerger : public GPUProcessor
6666
static constexpr const int32_t NSECTORS = GPUCA_NSECTORS; //* N sectors
6767

6868
struct memory {
69-
GPUAtomic(uint32_t) nRetryRefit;
7069
GPUAtomic(uint32_t) nLoopData;
7170
GPUAtomic(uint32_t) nUnpackedTracks;
7271
GPUAtomic(uint32_t) nMergedTracks;
@@ -119,7 +118,6 @@ class GPUTPCGMMerger : public GPUProcessor
119118
GPUhdi() GPUAtomic(uint32_t) * ClusterAttachment() const { return mClusterAttachment; }
120119
GPUhdi() uint32_t* TrackOrderAttach() const { return mTrackOrderAttach; }
121120
GPUhdi() uint32_t* TrackOrderProcess() const { return mTrackOrderProcess; }
122-
GPUhdi() uint32_t* RetryRefitIds() const { return mRetryRefitIds; }
123121
GPUhdi() uint8_t* ClusterStateExt() const { return mClusterStateExt; }
124122
GPUhdi() GPUTPCGMLoopData* LoopData() const { return mLoopData; }
125123
GPUhdi() memory* Memory() const { return mMemory; }
@@ -287,7 +285,6 @@ class GPUTPCGMMerger : public GPUProcessor
287285
gputpcgmmergertypes::GPUTPCGMBorderRange* mBorderRangeMemory = nullptr; // memory for border tracks
288286
gputpcgmmergertypes::GPUTPCGMBorderRange* mBorderRange[NSECTORS]; // memory for border tracks
289287
memory* mMemory = nullptr;
290-
uint32_t* mRetryRefitIds = nullptr;
291288
GPUTPCGMLoopData* mLoopData = nullptr;
292289
};
293290
} // namespace o2::gpu

GPU/GPUTracking/Merger/GPUTPCGMMergerGPU.cxx

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -21,10 +21,9 @@ using namespace o2::gpu;
2121
template <>
2222
GPUdii() void GPUTPCGMMergerTrackFit::Thread<0>(int32_t nBlocks, int32_t nThreads, int32_t iBlock, int32_t iThread, GPUsharedref() GPUSharedMemory& smem, processorType& GPUrestrict() merger, int32_t mode)
2323
{
24-
const int32_t iEnd = mode == -1 ? merger.Memory()->nRetryRefit : merger.NMergedTracks();
25-
GPUCA_TBB_KERNEL_LOOP(merger.GetRec(), int32_t, ii, iEnd, {
26-
const int32_t i = mode == -1 ? merger.RetryRefitIds()[ii] : mode ? merger.TrackOrderProcess()[ii] : ii;
27-
GPUTPCGMTrackParam::RefitTrack(merger.MergedTracks()[i], i, &merger, mode == -1);
24+
GPUCA_TBB_KERNEL_LOOP(merger.GetRec(), int32_t, ii, merger.NMergedTracks(), {
25+
const int32_t i = mode ? merger.TrackOrderProcess()[ii] : ii;
26+
GPUTPCGMTrackParam::RefitTrack(merger.MergedTracks()[i], i, &merger);
2827
});
2928
}
3029

GPU/GPUTracking/Merger/GPUTPCGMTrackParam.cxx

Lines changed: 11 additions & 38 deletions
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,7 @@
4848
using namespace o2::gpu;
4949
using namespace o2::tpc;
5050

51-
GPUd() bool GPUTPCGMTrackParam::Fit(GPUTPCGMMerger* GPUrestrict() merger, int32_t iTrk, GPUTPCGMMergedTrackHit* GPUrestrict() clusters, int32_t& GPUrestrict() N, int32_t& GPUrestrict() NTolerated, float& GPUrestrict() Alpha, int32_t attempt, float maxSinPhi, GPUTPCGMMergedTrack& GPUrestrict() track)
51+
GPUd() bool GPUTPCGMTrackParam::Fit(GPUTPCGMMerger* GPUrestrict() merger, int32_t iTrk, GPUTPCGMMergedTrackHit* GPUrestrict() clusters, int32_t& GPUrestrict() N, int32_t& GPUrestrict() NTolerated, float& GPUrestrict() Alpha, float maxSinPhi, GPUTPCGMMergedTrack& GPUrestrict() track)
5252
{
5353
static constexpr float kDeg2Rad = M_PI / 180.f;
5454
CADEBUG(static constexpr float kSectAngle = 2 * M_PI / 18.f);
@@ -92,7 +92,7 @@ GPUd() bool GPUTPCGMTrackParam::Fit(GPUTPCGMMerger* GPUrestrict() merger, int32_
9292
const float maxSinForUpdate = CAMath::Sin(70.f * kDeg2Rad);
9393

9494
ResetCovariance();
95-
prop.SetSeedingErrors(!(refit && attempt == 0));
95+
prop.SetSeedingErrors(!(refit));
9696
prop.SetFitInProjections(true); // param.rec.fitInProjections == -1 ? (iWay == 0) : param.rec.fitInProjections); // TODO: Reenable once fixed
9797
prop.SetPropagateBzOnly(param.rec.fitPropagateBzOnly == -1 ? !finalFit : param.rec.fitPropagateBzOnly);
9898
prop.SetMatLUT((param.rec.useMatLUT && finalFit) ? merger->GetConstantMem()->calibObjects.matLUT : nullptr);
@@ -105,7 +105,6 @@ GPUd() bool GPUTPCGMTrackParam::Fit(GPUTPCGMMerger* GPUrestrict() merger, int32_
105105
const bool inFlyDirection = iWay & 1;
106106
const int32_t wayDirection = (iWay & 1) ? -1 : 1;
107107

108-
int32_t goodRows = 0;
109108
for (int32_t ihit = ihitStart; ihit >= 0 && ihit < maxN; ihit += wayDirection) {
110109
const bool crossCE = lastSector != 255 && ((lastSector < 18) ^ (clusters[ihit].sector < 18));
111110
if (crossCE) {
@@ -179,11 +178,6 @@ GPUd() bool GPUTPCGMTrackParam::Fit(GPUTPCGMMerger* GPUrestrict() merger, int32_
179178
retValProp = prop.PropagateToXAlpha(xx, clAlpha, inFlyDirection);
180179
}
181180
}
182-
if (lastRow == 255 || CAMath::Abs((int32_t)lastRow - (int32_t)cluster.row) > 5 || lastSector != cluster.sector || (param.rec.tpc.trackFitRejectMode < 0 && -nMissed <= param.rec.tpc.trackFitRejectMode)) {
183-
goodRows = 0;
184-
} else {
185-
goodRows++;
186-
}
187181
if (retValProp == 0) {
188182
lastRow = cluster.row;
189183
lastSector = cluster.sector;
@@ -228,17 +222,13 @@ GPUd() bool GPUTPCGMTrackParam::Fit(GPUTPCGMMerger* GPUrestrict() merger, int32_
228222
retValUpd = GPUTPCGMPropagator::updateErrorClusterRejectedDistance;
229223
} else {
230224
int8_t rejectChi2 = 0;
231-
if (attempt == 0) {
232-
if (param.rec.tpc.mergerInterpolateErrors && CAMath::Abs(ihit - ihitMergeFirst) <= 1) {
233-
if (iWay == nWays - 3) {
234-
rejectChi2 = GPUTPCGMPropagator::rejectInterFill;
235-
} else if (iWay == nWays - 2) {
236-
rejectChi2 = GPUTPCGMPropagator::rejectInterReject;
237-
} else if (iWay == nWays - 1) {
238-
rejectChi2 = (param.rec.tpc.mergerInterpolateRejectAlsoOnCurrentPosition && GetNDF() > (int32_t)param.rec.tpc.mergerNonInterpolateRejectMinNDF) ? GPUTPCGMPropagator::rejectDirect : 0;
239-
}
240-
} else {
241-
rejectChi2 = allowChangeClusters && goodRows > 5;
225+
if (param.rec.tpc.mergerInterpolateErrors && CAMath::Abs(ihit - ihitMergeFirst) <= 1) {
226+
if (iWay == nWays - 3) {
227+
rejectChi2 = GPUTPCGMPropagator::rejectInterFill;
228+
} else if (iWay == nWays - 2) {
229+
rejectChi2 = GPUTPCGMPropagator::rejectInterReject;
230+
} else if (iWay == nWays - 1) {
231+
rejectChi2 = (param.rec.tpc.mergerInterpolateRejectAlsoOnCurrentPosition && GetNDF() > (int32_t)param.rec.tpc.mergerNonInterpolateRejectMinNDF) ? GPUTPCGMPropagator::rejectDirect : 0;
242232
}
243233
}
244234

@@ -905,7 +895,7 @@ GPUd() bool GPUTPCGMTrackParam::CheckNumericalQuality(float overrideCovYY) const
905895
return ok;
906896
}
907897

908-
GPUdii() void GPUTPCGMTrackParam::RefitTrack(GPUTPCGMMergedTrack& GPUrestrict() track, int32_t iTrk, GPUTPCGMMerger* GPUrestrict() merger, int32_t attempt) // VS: GPUd changed to GPUdii. No change in output and no performance penalty.
898+
GPUdii() void GPUTPCGMTrackParam::RefitTrack(GPUTPCGMMergedTrack& GPUrestrict() track, int32_t iTrk, GPUTPCGMMerger* GPUrestrict() merger) // VS: GPUd changed to GPUdii. No change in output and no performance penalty.
909899
{
910900
if (!track.OK()) {
911901
return;
@@ -920,27 +910,10 @@ GPUdii() void GPUTPCGMTrackParam::RefitTrack(GPUTPCGMMergedTrack& GPUrestrict()
920910
GPUTPCGMTrackParam t = track.Param();
921911
float Alpha = track.Alpha();
922912
CADEBUG(int32_t nTrackHitsOld = nTrackHits; float ptOld = t.QPt());
923-
bool ok = t.Fit(merger, iTrk, merger->Clusters() + track.FirstClusterRef(), nTrackHits, NTolerated, Alpha, attempt, GPUCA_MAX_SIN_PHI, track);
913+
bool ok = t.Fit(merger, iTrk, merger->Clusters() + track.FirstClusterRef(), nTrackHits, NTolerated, Alpha, GPUCA_MAX_SIN_PHI, track);
924914
CADEBUG(printf("Finished Fit Track %d\n", iTrk));
925915
CADEBUG(printf("OUTPUT hits %d -> %d+%d = %d, QPt %f -> %f, SP %f, OK %d chi2 %f chi2ndf %f\n", nTrackHitsOld, nTrackHits, NTolerated, nTrackHits + NTolerated, ptOld, t.QPt(), t.SinPhi(), (int32_t)ok, t.Chi2(), t.Chi2() / CAMath::Max(1, nTrackHits)));
926916

927-
if (!ok && attempt == 0 && merger->Param().rec.tpc.retryRefit) {
928-
for (uint32_t i = 0; i < track.NClusters(); i++) {
929-
merger->Clusters()[track.FirstClusterRef() + i].state &= GPUTPCGMMergedTrackHit::clustererAndSharedFlags;
930-
}
931-
CADEBUG(printf("Track rejected, marking for retry\n"));
932-
if (merger->Param().rec.tpc.retryRefit == 2) {
933-
nTrackHits = track.NClusters();
934-
NTolerated = 0; // Clusters not fit but tollerated for track length cut
935-
t = track.Param();
936-
Alpha = track.Alpha();
937-
ok = t.Fit(merger, iTrk, merger->Clusters() + track.FirstClusterRef(), nTrackHits, NTolerated, Alpha, 1, GPUCA_MAX_SIN_PHI, track);
938-
} else {
939-
uint32_t nRefit = CAMath::AtomicAdd(&merger->Memory()->nRetryRefit, 1u);
940-
merger->RetryRefitIds()[nRefit] = iTrk;
941-
return;
942-
}
943-
}
944917
if (CAMath::Abs(t.QPt()) < 1.e-4f) {
945918
t.QPt() = 1.e-4f;
946919
}

GPU/GPUTracking/Merger/GPUTPCGMTrackParam.h

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -141,7 +141,7 @@ class GPUTPCGMTrackParam
141141
GPUd() bool CheckNumericalQuality(float overrideCovYY = -1.f) const;
142142
GPUd() bool CheckCov() const;
143143

144-
GPUd() bool Fit(GPUTPCGMMerger* merger, int32_t iTrk, GPUTPCGMMergedTrackHit* clusters, int32_t& N, int32_t& NTolerated, float& Alpha, int32_t attempt, float maxSinPhi, GPUTPCGMMergedTrack& track);
144+
GPUd() bool Fit(GPUTPCGMMerger* merger, int32_t iTrk, GPUTPCGMMergedTrackHit* clusters, int32_t& N, int32_t& NTolerated, float& Alpha, float maxSinPhi, GPUTPCGMMergedTrack& track);
145145
GPUd() void MoveToReference(GPUTPCGMPropagator& prop, const GPUParam& param, float& alpha);
146146
GPUd() void MirrorTo(GPUTPCGMPropagator& prop, float toY, float toZ, bool inFlyDirection, const GPUParam& param, uint8_t row, uint8_t clusterState, bool mirrorParameters, int8_t sector);
147147
GPUd() int32_t MergeDoubleRowClusters(int32_t& ihit, int32_t wayDirection, GPUTPCGMMergedTrackHit* clusters, const GPUTPCGMMerger* merger, GPUTPCGMPropagator& prop, float& xx, float& yy, float& zz, int32_t maxN, float clAlpha, uint8_t& clusterState, bool rejectChi2);
@@ -200,7 +200,7 @@ class GPUTPCGMTrackParam
200200
}
201201
}
202202

203-
GPUd() static void RefitTrack(GPUTPCGMMergedTrack& track, int32_t iTrk, GPUTPCGMMerger* merger, int32_t attempt);
203+
GPUd() static void RefitTrack(GPUTPCGMMergedTrack& track, int32_t iTrk, GPUTPCGMMerger* merger);
204204

205205
GPUdi() void ConstrainSinPhi(float limit = GPUCA_MAX_SIN_PHI)
206206
{

0 commit comments

Comments
 (0)