@@ -630,23 +630,23 @@ int32_t GPUChainTracking::RunTPCClusterizer(bool synchronizeOutput)
630630 mRec ->runParallelOuterLoop (doGPU, numLanes, [&](uint32_t lane) {
631631 nnApplications[lane].init (nn_settings);
632632 if (nnApplications[lane].modelsUsed [0 ]) {
633- SetONNXGPUStream ((nnApplications[lane].model_class ).getSessionOptions (), lane + numLanes , &deviceId);
633+ SetONNXGPUStream ((nnApplications[lane].model_class ).getSessionOptions (), lane, &deviceId);
634634 (nnApplications[lane].model_class ).setDeviceId (deviceId);
635635 if (nnApplications[lane].model_class .getIntraOpNumThreads () > maxThreads) {
636636 nnApplications[lane].model_class .setIntraOpNumThreads (maxThreads);
637637 }
638638 (nnApplications[lane].model_class ).initEnvironment ();
639639 }
640640 if (nnApplications[lane].modelsUsed [1 ]) {
641- SetONNXGPUStream ((nnApplications[lane].model_reg_1 ).getSessionOptions (), lane + 2 *numLanes , &deviceId);
641+ SetONNXGPUStream ((nnApplications[lane].model_reg_1 ).getSessionOptions (), lane, &deviceId);
642642 (nnApplications[lane].model_reg_1 ).setDeviceId (deviceId);
643643 if (nnApplications[lane].model_reg_1 .getIntraOpNumThreads () > maxThreads) {
644644 nnApplications[lane].model_reg_1 .setIntraOpNumThreads (maxThreads);
645645 }
646646 (nnApplications[lane].model_reg_1 ).initEnvironment ();
647647 }
648648 if (nnApplications[lane].modelsUsed [2 ]) {
649- SetONNXGPUStream ((nnApplications[lane].model_reg_2 ).getSessionOptions (), lane + 3 *numLanes , &deviceId);
649+ SetONNXGPUStream ((nnApplications[lane].model_reg_2 ).getSessionOptions (), lane, &deviceId);
650650 (nnApplications[lane].model_reg_2 ).setDeviceId (deviceId);
651651 if (nnApplications[lane].model_reg_2 .getIntraOpNumThreads () > maxThreads) {
652652 nnApplications[lane].model_reg_2 .setIntraOpNumThreads (maxThreads);
@@ -1039,7 +1039,6 @@ int32_t GPUChainTracking::RunTPCClusterizer(bool synchronizeOutput)
10391039 }
10401040 LOG (info) << " [NN CF] Apply NN (fragment " << fragment.index << " , lane: " << lane << " , sector: " << iSector << " ): filling data " << time_fill << " s ; networks: " << time_networks << " s ; clusterizer: " << time_clusterizer << " s ; " << clusterer.mPmemory ->counters .nClusters << " clusters, " << acceptedClusters << " accepted. --> " << (int32_t )clusterer.mPmemory ->counters .nClusters / (time_fill + time_clusterizer) << " clusters/s" ;
10411041 }
1042- TransferMemoryResourcesToHost (RecoStep::TPCClusterFinding, &clustererNN, lane);
10431042#else
10441043 GPUFatal (" Project not compiled with neural network clusterization. Aborting." );
10451044#endif
0 commit comments