@@ -311,7 +311,7 @@ GPUdii() gpuSpan<const Cluster> getClustersOnLayer(const int rof,
311311}
312312
313313template <int nLayers>
314- GPUg () void fitTrackSeedsKernel (
314+ GPUg () void __launch_bounds__ ( 256 , 1 ) fitTrackSeedsKernel(
315315 CellSeed<nLayers>* trackSeeds,
316316 const TrackingFrameInfo** foundTrackingFrameInfo,
317317 o2::its::TrackITSExt* tracks,
@@ -374,7 +374,7 @@ GPUg() void fitTrackSeedsKernel(
374374}
375375
376376template <bool initRun, int nLayers = 7 >
377- GPUg () void computeLayerCellNeighboursKernel (
377+ GPUg () void __launch_bounds__ ( 256 , 1 ) computeLayerCellNeighboursKernel(
378378 CellSeed<nLayers>** cellSeedArray,
379379 int * neighboursLUT,
380380 int * neighboursIndexTable,
@@ -438,7 +438,7 @@ GPUg() void computeLayerCellNeighboursKernel(
438438}
439439
440440template <bool initRun, int nLayers>
441- GPUg () void computeLayerCellsKernel (
441+ GPUg () void __launch_bounds__ ( 256 , 1 ) computeLayerCellsKernel(
442442 const Cluster** sortedClusters,
443443 const Cluster** unsortedClusters,
444444 const TrackingFrameInfo** tfInfo,
@@ -525,7 +525,7 @@ GPUg() void computeLayerCellsKernel(
525525}
526526
527527template <bool initRun, int nLayers>
528- GPUg () void computeLayerTrackletsMultiROFKernel (
528+ GPUg () void __launch_bounds__ ( 256 , 1 ) computeLayerTrackletsMultiROFKernel(
529529 const IndexTableUtils<nLayers>* utils,
530530 const uint8_t * multMask,
531531 const int layerIndex,
@@ -652,7 +652,8 @@ GPUg() void computeLayerTrackletsMultiROFKernel(
652652 }
653653}
654654
655- GPUg () void compileTrackletsLookupTableKernel (const Tracklet* tracklets,
655+ GPUg () void __launch_bounds__ (256 , 1 ) compileTrackletsLookupTableKernel(
656+ const Tracklet* tracklets,
656657 int * trackletsLookUpTable,
657658 const int nTracklets)
658659{
@@ -662,7 +663,8 @@ GPUg() void compileTrackletsLookupTableKernel(const Tracklet* tracklets,
662663}
663664
664665template <bool dryRun, int nLayers = 7 >
665- GPUg () void processNeighboursKernel (const int layer,
666+ GPUg () void __launch_bounds__ (256 , 1 ) processNeighboursKernel(
667+ const int layer,
666668 const int level,
667669 CellSeed<nLayers>** allCellSeeds,
668670 CellSeed<nLayers>* currentCellSeeds,
0 commit comments