Simplify GPUCAMath a bit

davidrohr · davidrohr · commit 3d0c1b290254 · 2025-03-13T09:02:24.000+01:00
diff --git a/GPU/Common/GPUCommonMath.h b/GPU/Common/GPUCommonMath.h
@@ -33,6 +33,15 @@
 #include <cstdint>
 #endif
 
+// GPUCA_CHOICE Syntax: GPUCA_CHOICE(Host, CUDA&HIP, OpenCL)
+#if defined(GPUCA_GPUCODE_DEVICE) && (defined(__CUDACC__) || defined(__HIPCC__)) // clang-format off
+    #define GPUCA_CHOICE(c1, c2, c3) (c2) // Select second option for CUDA and HIP
+#elif defined(GPUCA_GPUCODE_DEVICE) && defined (__OPENCL__)
+    #define GPUCA_CHOICE(c1, c2, c3) (c3) // Select third option for OpenCL
+#else
+    #define GPUCA_CHOICE(c1, c2, c3) (c1) // Select first option for Host
+#endif // clang-format on
+
 namespace o2
 {
 namespace gpu
@@ -44,9 +53,15 @@ class GPUCommonMath
   GPUd() static float2 MakeFloat2(float x, float y); // TODO: Find better appraoch that is constexpr
 
   template <class T>
-  GPUhd() static T Min(const T x, const T y);
+  GPUhd() static T Min(const T x, const T y)
+  {
+    return GPUCA_CHOICE(std::min(x, y), min(x, y), min(x, y));
+  }
   template <class T>
-  GPUhd() static T Max(const T x, const T y);
+  GPUhd() static T Max(const T x, const T y)
+  {
+    return GPUCA_CHOICE(std::max(x, y), max(x, y), max(x, y));
+  }
   template <class T, class S, class R>
   GPUd() static T MinWithRef(T x, T y, S refX, S refY, R& r);
   template <class T, class S, class R>
@@ -74,28 +89,28 @@ class GPUCommonMath
   GPUd() static float Pow(float x, float y);
   GPUd() static float Log(float x);
   GPUd() static float Exp(float x);
-  GPUhdni() static float Copysign(float x, float y);
+  GPUhdni() static float Copysign(float x, float y) { return GPUCA_CHOICE(std::copysignf(x, y), copysignf(x, y), copysign(x, y)); }
   GPUd() static constexpr float TwoPi() { return 6.2831853f; }
   GPUd() static constexpr float Pi() { return 3.1415927f; }
   GPUd() static float Round(float x);
-  GPUd() static float Floor(float x);
+  GPUd() static float Floor(float x) { return GPUCA_CHOICE(floorf(x), floorf(x), floor(x)); }
   GPUd() static uint32_t Float2UIntReint(const float& x);
-  GPUd() static uint32_t Float2UIntRn(float x);
+  GPUd() static uint32_t Float2UIntRn(float x) { return (uint32_t)(int32_t)(x + 0.5f); }
   GPUd() static int32_t Float2IntRn(float x);
   GPUd() static float Modf(float x, float y);
-  GPUd() static bool Finite(float x);
-  GPUd() static bool IsNaN(float x);
+  GPUd() static bool Finite(float x) { return GPUCA_CHOICE(std::isfinite(x), isfinite(x), isfinite(x)); }
+  GPUd() static bool IsNaN(float x) { return GPUCA_CHOICE(std::isnan(x), isnan(x), isnan(x)); }
   GPUd() static bool FiniteRelaxed(float x); // always true if not using NO_FAST_MATH
   GPUd() static bool IsNaNRelaxed(float x);  // always true if not using NO_FAST_MATH
-  GPUd() static float QuietNaN();
+  GPUd() static float QuietNaN() { return GPUCA_CHOICE(std::numeric_limits<float>::quiet_NaN(), __builtin_nanf(""), nan(0u)); }
   GPUd() static uint32_t Clz(uint32_t val);
   GPUd() static uint32_t Popcount(uint32_t val);
 
   GPUd() static void memcpy(void* dst, const void* src, size_t size);
 
-  GPUhdni() static float Hypot(float x, float y);
-  GPUhdni() static float Hypot(float x, float y, float z);
-  GPUhdni() static float Hypot(float x, float y, float z, float w);
+  GPUhdi() static float Hypot(float x, float y) { return Sqrt(x * x + y * y); }
+  GPUhdi() static float Hypot(float x, float y, float z) { return Sqrt(x * x + y * y + z * z); }
+  GPUhdi() static float Hypot(float x, float y, float z, float w) { return Sqrt(x * x + y * y + z * z + w * w); }
 
   template <typename T>
   GPUhd() static void Swap(T& a, T& b);
@@ -154,15 +169,7 @@ class GPUCommonMath
   GPUd() constexpr static T nextMultipleOf(T val);
 
   template <typename... Args>
-  GPUdi() static float Sum2(float w, Args... args)
-  {
-    if constexpr (sizeof...(Args) == 0) {
-      return w * w;
-    } else {
-      return w * w + Sum2(args...);
-    }
-    return 0;
-  }
+  GPUhdni() static float Sum2(float w, Args... args);
 
  private:
   template <class S, class T>
@@ -179,14 +186,16 @@ class GPUCommonMath
 
 typedef GPUCommonMath CAMath;
 
-// CHOICE Syntax: CHOICE(Host, CUDA&HIP, OpenCL)
-#if defined(GPUCA_GPUCODE_DEVICE) && (defined(__CUDACC__) || defined(__HIPCC__)) // clang-format off
-    #define CHOICE(c1, c2, c3) (c2) // Select second option for CUDA and HIP
-#elif defined(GPUCA_GPUCODE_DEVICE) && defined (__OPENCL__)
-    #define CHOICE(c1, c2, c3) (c3) // Select third option for OpenCL
-#else
-    #define CHOICE(c1, c2, c3) (c1) // Select first option for Host
-#endif // clang-format on
+template <typename... Args>
+GPUhdi() float GPUCommonMath::Sum2(float w, Args... args)
+{
+  if constexpr (sizeof...(Args) == 0) {
+    return w * w;
+  } else {
+    return w * w + Sum2(args...);
+  }
+  return 0;
+}
 
 GPUdi() void GPUCommonMath::memcpy(void* dst, const void* src, size_t size)
 {
@@ -230,7 +239,7 @@ GPUdi() float2 GPUCommonMath::MakeFloat2(float x, float y)
 #endif // GPUCA_GPUCODE
 }
 
-GPUdi() float GPUCommonMath::Modf(float x, float y) { return CHOICE(fmodf(x, y), fmodf(x, y), fmod(x, y)); }
+GPUdi() float GPUCommonMath::Modf(float x, float y) { return GPUCA_CHOICE(fmodf(x, y), fmodf(x, y), fmod(x, y)); }
 
 GPUdi() uint32_t GPUCommonMath::Float2UIntReint(const float& x)
 {
@@ -243,42 +252,36 @@ GPUdi() uint32_t GPUCommonMath::Float2UIntReint(const float& x)
 #endif
 }
 
-GPUdi() uint32_t GPUCommonMath::Float2UIntRn(float x) { return (uint32_t)(int32_t)(x + 0.5f); }
-GPUdi() float GPUCommonMath::Floor(float x) { return CHOICE(floorf(x), floorf(x), floor(x)); }
-
-GPUdi() bool GPUCommonMath::Finite(float x) { return CHOICE(std::isfinite(x), isfinite(x), isfinite(x)); }
-GPUdi() bool GPUCommonMath::IsNaN(float x) { return CHOICE(std::isnan(x), isnan(x), isnan(x)); }
-GPUdi() float GPUCommonMath::QuietNaN() { return CHOICE(std::numeric_limits<float>::quiet_NaN(), __builtin_nanf(""), nan(0u)); }
 #ifdef GPUCA_NO_FAST_MATH
-GPUdi() float GPUCommonMath::Round(float x) { return CHOICE(roundf(x), roundf(x), round(x)); }
+GPUdi() float GPUCommonMath::Round(float x) { return GPUCA_CHOICE(roundf(x), roundf(x), round(x)); }
 GPUdi() int32_t GPUCommonMath::Float2IntRn(float x) { return (int32_t)Round(x); }
-GPUhdi() float GPUCommonMath::Sqrt(float x) { return CHOICE(sqrtf(x), (float)sqrt((double)x), sqrt(x)); }
-GPUdi() float GPUCommonMath::ATan(float x) { return CHOICE((float)atan((double)x), (float)atan((double)x), atan(x)); }
-GPUhdi() float GPUCommonMath::ATan2(float y, float x) { return CHOICE((float)atan2((double)y, (double)x), (float)atan2((double)y, (double)x), atan2(y, x)); }
-GPUdi() float GPUCommonMath::Sin(float x) { return CHOICE((float)sin((double)x), (float)sin((double)x), sin(x)); }
-GPUdi() float GPUCommonMath::Cos(float x) { return CHOICE((float)cos((double)x), (float)cos((double)x), cos(x)); }
-GPUdi() float GPUCommonMath::Tan(float x) { return CHOICE((float)tanf((double)x), (float)tanf((double)x), tan(x)); }
-GPUdi() float GPUCommonMath::Pow(float x, float y) { return CHOICE((float)pow((double)x, (double)y), pow((double)x, (double)y), pow(x, y)); }
-GPUdi() float GPUCommonMath::ASin(float x) { return CHOICE((float)asin((double)x), (float)asin((double)x), asin(x)); }
-GPUdi() float GPUCommonMath::ACos(float x) { return CHOICE((float)acos((double)x), (float)acos((double)x), acos(x)); }
-GPUdi() float GPUCommonMath::Log(float x) { return CHOICE((float)log((double)x), (float)log((double)x), log(x)); }
-GPUdi() float GPUCommonMath::Exp(float x) { return CHOICE((float)exp((double)x), (float)exp((double)x), exp(x)); }
+GPUhdi() float GPUCommonMath::Sqrt(float x) { return GPUCA_CHOICE(sqrtf(x), (float)sqrt((double)x), sqrt(x)); }
+GPUdi() float GPUCommonMath::ATan(float x) { return GPUCA_CHOICE((float)atan((double)x), (float)atan((double)x), atan(x)); }
+GPUhdi() float GPUCommonMath::ATan2(float y, float x) { return GPUCA_CHOICE((float)atan2((double)y, (double)x), (float)atan2((double)y, (double)x), atan2(y, x)); }
+GPUdi() float GPUCommonMath::Sin(float x) { return GPUCA_CHOICE((float)sin((double)x), (float)sin((double)x), sin(x)); }
+GPUdi() float GPUCommonMath::Cos(float x) { return GPUCA_CHOICE((float)cos((double)x), (float)cos((double)x), cos(x)); }
+GPUdi() float GPUCommonMath::Tan(float x) { return GPUCA_CHOICE((float)tanf((double)x), (float)tanf((double)x), tan(x)); }
+GPUdi() float GPUCommonMath::Pow(float x, float y) { return GPUCA_CHOICE((float)pow((double)x, (double)y), pow((double)x, (double)y), pow(x, y)); }
+GPUdi() float GPUCommonMath::ASin(float x) { return GPUCA_CHOICE((float)asin((double)x), (float)asin((double)x), asin(x)); }
+GPUdi() float GPUCommonMath::ACos(float x) { return GPUCA_CHOICE((float)acos((double)x), (float)acos((double)x), acos(x)); }
+GPUdi() float GPUCommonMath::Log(float x) { return GPUCA_CHOICE((float)log((double)x), (float)log((double)x), log(x)); }
+GPUdi() float GPUCommonMath::Exp(float x) { return GPUCA_CHOICE((float)exp((double)x), (float)exp((double)x), exp(x)); }
 GPUdi() bool GPUCommonMath::FiniteRelaxed(float x) { return Finite(x); }
 GPUdi() bool GPUCommonMath::IsNaNRelaxed(float x) { return IsNaN(x); }
 #else
-GPUdi() float GPUCommonMath::Round(float x) { return CHOICE(roundf(x), rintf(x), rint(x)); }
-GPUdi() int32_t GPUCommonMath::Float2IntRn(float x) { return CHOICE((int32_t)Round(x), __float2int_rn(x), (int32_t)Round(x)); }
-GPUhdi() float GPUCommonMath::Sqrt(float x) { return CHOICE(sqrtf(x), sqrtf(x), sqrt(x)); }
-GPUdi() float GPUCommonMath::ATan(float x) { return CHOICE(atanf(x), atanf(x), atan(x)); }
-GPUhdi() float GPUCommonMath::ATan2(float y, float x) { return CHOICE(atan2f(y, x), atan2f(y, x), atan2(y, x)); }
-GPUdi() float GPUCommonMath::Sin(float x) { return CHOICE(sinf(x), sinf(x), sin(x)); }
-GPUdi() float GPUCommonMath::Cos(float x) { return CHOICE(cosf(x), cosf(x), cos(x)); }
-GPUdi() float GPUCommonMath::Tan(float x) { return CHOICE(tanf(x), tanf(x), tan(x)); }
-GPUdi() float GPUCommonMath::Pow(float x, float y) { return CHOICE(powf(x, y), powf(x, y), pow(x, y)); }
-GPUdi() float GPUCommonMath::ASin(float x) { return CHOICE(asinf(x), asinf(x), asin(x)); }
-GPUdi() float GPUCommonMath::ACos(float x) { return CHOICE(acosf(x), acosf(x), acos(x)); }
-GPUdi() float GPUCommonMath::Log(float x) { return CHOICE(logf(x), logf(x), log(x)); }
-GPUdi() float GPUCommonMath::Exp(float x) { return CHOICE(expf(x), expf(x), exp(x)); }
+GPUdi() float GPUCommonMath::Round(float x) { return GPUCA_CHOICE(roundf(x), rintf(x), rint(x)); }
+GPUdi() int32_t GPUCommonMath::Float2IntRn(float x) { return GPUCA_CHOICE((int32_t)Round(x), __float2int_rn(x), (int32_t)Round(x)); }
+GPUhdi() float GPUCommonMath::Sqrt(float x) { return GPUCA_CHOICE(sqrtf(x), sqrtf(x), sqrt(x)); }
+GPUdi() float GPUCommonMath::ATan(float x) { return GPUCA_CHOICE(atanf(x), atanf(x), atan(x)); }
+GPUhdi() float GPUCommonMath::ATan2(float y, float x) { return GPUCA_CHOICE(atan2f(y, x), atan2f(y, x), atan2(y, x)); }
+GPUdi() float GPUCommonMath::Sin(float x) { return GPUCA_CHOICE(sinf(x), sinf(x), sin(x)); }
+GPUdi() float GPUCommonMath::Cos(float x) { return GPUCA_CHOICE(cosf(x), cosf(x), cos(x)); }
+GPUdi() float GPUCommonMath::Tan(float x) { return GPUCA_CHOICE(tanf(x), tanf(x), tan(x)); }
+GPUdi() float GPUCommonMath::Pow(float x, float y) { return GPUCA_CHOICE(powf(x, y), powf(x, y), pow(x, y)); }
+GPUdi() float GPUCommonMath::ASin(float x) { return GPUCA_CHOICE(asinf(x), asinf(x), asin(x)); }
+GPUdi() float GPUCommonMath::ACos(float x) { return GPUCA_CHOICE(acosf(x), acosf(x), acos(x)); }
+GPUdi() float GPUCommonMath::Log(float x) { return GPUCA_CHOICE(logf(x), logf(x), log(x)); }
+GPUdi() float GPUCommonMath::Exp(float x) { return GPUCA_CHOICE(expf(x), expf(x), exp(x)); }
 GPUdi() bool GPUCommonMath::FiniteRelaxed(float x) { return true; }
 GPUdi() bool GPUCommonMath::IsNaNRelaxed(float x) { return false; }
 #endif
@@ -293,7 +296,7 @@ GPUhdi() void GPUCommonMath::SinCos(float x, float& s, float& c)
 #elif !defined(GPUCA_GPUCODE_DEVICE) && (defined(__GNU_SOURCE__) || defined(_GNU_SOURCE) || defined(GPUCA_GPUCODE))
   sincosf(x, &s, &c);
 #else
-  CHOICE((void)((s = sinf(x)) + (c = cosf(x))), sincosf(x, &s, &c), s = sincos(x, &c));
+  GPUCA_CHOICE((void)((s = sinf(x)) + (c = cosf(x))), sincosf(x, &s, &c), s = sincos(x, &c));
 #endif
 }
 
@@ -304,14 +307,14 @@ GPUhdi() void GPUCommonMath::SinCosd(double x, double& s, double& c)
 #elif !defined(GPUCA_GPUCODE_DEVICE) && (defined(__GNU_SOURCE__) || defined(_GNU_SOURCE) || defined(GPUCA_GPUCODE))
   sincos(x, &s, &c);
 #else
-  CHOICE((void)((s = sin(x)) + (c = cos(x))), sincos(x, &s, &c), s = sincos(x, &c));
+  GPUCA_CHOICE((void)((s = sin(x)) + (c = cos(x))), sincos(x, &s, &c), s = sincos(x, &c));
 #endif
 }
 
 GPUdi() uint32_t GPUCommonMath::Clz(uint32_t x)
 {
 #if (defined(__GNUC__) || defined(__clang__) || defined(__CUDACC__) || defined(__HIPCC__))
-  return x == 0 ? 32 : CHOICE(__builtin_clz(x), __clz(x), __builtin_clz(x)); // use builtin if available
+  return x == 0 ? 32 : GPUCA_CHOICE(__builtin_clz(x), __clz(x), __builtin_clz(x)); // use builtin if available
 #else
   for (int32_t i = 31; i >= 0; i--) {
     if (x & (1u << i)) {
@@ -326,53 +329,24 @@ GPUdi() uint32_t GPUCommonMath::Popcount(uint32_t x)
 {
 #if (defined(__GNUC__) || defined(__clang__) || defined(__CUDACC__) || defined(__HIPCC__)) && !defined(__OPENCL__) // TODO: remove OPENCL when reported SPIR-V bug is fixed
   // use builtin if available
-  return CHOICE(__builtin_popcount(x), __popc(x), __builtin_popcount(x));
+  return GPUCA_CHOICE(__builtin_popcount(x), __popc(x), __builtin_popcount(x));
 #else
   x = x - ((x >> 1) & 0x55555555);
   x = (x & 0x33333333) + ((x >> 2) & 0x33333333);
   return (((x + (x >> 4)) & 0x0F0F0F0F) * 0x01010101) >> 24;
 #endif
 }
 
-GPUhdi() float GPUCommonMath::Hypot(float x, float y)
-{
-  return Sqrt(x * x + y * y);
-}
-
-GPUhdi() float GPUCommonMath::Hypot(float x, float y, float z)
-{
-  return Sqrt(x * x + y * y + z * z);
-}
-
-GPUhdi() float GPUCommonMath::Hypot(float x, float y, float z, float w)
-{
-  return Sqrt(x * x + y * y + z * z + w * w);
-}
-
 template <typename T>
-GPUd() void _swap(T& a, T& b)
+GPUhdi() void GPUCommonMath::Swap(T& a, T& b)
 {
+#ifndef GPUCA_GPUCODE_DEVICE
+  std::swap(a, b);
+#else
   T tmp = a;
   a = b;
   b = tmp;
-}
-
-template <typename T>
-GPUhdi() void GPUCommonMath::Swap(T& a, T& b)
-{
-  CHOICE(std::swap(a, b), _swap<T>(a, b), _swap<T>(a, b));
-}
-
-template <class T>
-GPUhdi() T GPUCommonMath::Min(const T x, const T y)
-{
-  return CHOICE(std::min(x, y), min(x, y), min(x, y));
-}
-
-template <class T>
-GPUhdi() T GPUCommonMath::Max(const T x, const T y)
-{
-  return CHOICE(std::max(x, y), max(x, y), max(x, y));
+#endif
 }
 
 template <class T, class S, class R>
@@ -441,32 +415,19 @@ GPUdi() float GPUCommonMath::InvSqrt(float _x)
 template <>
 GPUhdi() float GPUCommonMath::Abs<float>(float x)
 {
-  return CHOICE(fabsf(x), fabsf(x), fabs(x));
+  return GPUCA_CHOICE(fabsf(x), fabsf(x), fabs(x));
 }
 
-#if !defined(__OPENCL__) || defined(cl_khr_fp64)
 template <>
 GPUhdi() double GPUCommonMath::Abs<double>(double x)
 {
-  return CHOICE(fabs(x), fabs(x), fabs(x));
+  return GPUCA_CHOICE(fabs(x), fabs(x), fabs(x));
 }
-#endif
 
 template <>
 GPUhdi() int32_t GPUCommonMath::Abs<int32_t>(int32_t x)
 {
-  return CHOICE(abs(x), abs(x), abs(x));
-}
-
-GPUhdi() float GPUCommonMath::Copysign(float x, float y)
-{
-#if defined(__OPENCL__)
-  return copysign(x, y);
-#elif defined(GPUCA_GPUCODE) && !defined(__OPENCL__)
-  return copysignf(x, y);
-#else
-  return std::copysignf(x, y);
-#endif // GPUCA_GPUCODE
+  return GPUCA_CHOICE(abs(x), abs(x), abs(x));
 }
 
 template <class S, class T>
@@ -579,7 +540,7 @@ GPUdii() void GPUCommonMath::AtomicMinInternal(GPUglobalref() GPUgeneric() GPUAt
 }
 #endif
 
-#undef CHOICE
+#undef GPUCA_CHOICE
 
 } // namespace gpu
 } // namespace o2
diff --git a/GPU/GPUTracking/DataCompression/GPUTPCCompressionKernels.cxx b/GPU/GPUTracking/DataCompression/GPUTPCCompressionKernels.cxx
@@ -199,7 +199,7 @@ GPUdii() void GPUTPCCompressionKernels::Thread<GPUTPCCompressionKernels::step1un
 
     CompressedClustersPtrs& GPUrestrict() c = compressor.mPtrs;
 
-    const uint32_t nn = GPUCommonMath::nextMultipleOf<GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionKernels_step1unattached)>(clusters->nClusters[iSector][iRow]);
+    const uint32_t nn = CAMath::nextMultipleOf<GPUCA_GET_THREAD_COUNT(GPUCA_LB_GPUTPCCompressionKernels_step1unattached)>(clusters->nClusters[iSector][iRow]);
     for (uint32_t i = iThread; i < nn + nThreads; i += nThreads) {
       const int32_t idx = idOffset + i;
       int32_t cidx = 0;
diff --git a/GPU/GPUTracking/TRDTracking/GPUTRDTracker.cxx b/GPU/GPUTracking/TRDTracking/GPUTRDTracker.cxx
@@ -787,8 +787,8 @@ GPUd() bool GPUTRDTracker_t<TRDTRK, PROP>::FollowProlongation(PROP* prop, TRDTRK
         if (mHypothesis[iUpdate + hypothesisIdxOffset].mTrackletId == trkltIdx) {
           continue;
         }
-        if (GPUCommonMath::Abs(tracklets[mHypothesis[iUpdate + hypothesisIdxOffset].mTrackletId].GetZbin() - tracklets[trkltIdx].GetZbin()) == 1 &&
-            GPUCommonMath::Abs(tracklets[mHypothesis[iUpdate + hypothesisIdxOffset].mTrackletId].GetY() - tracklets[trkltIdx].GetY()) < 1) {
+        if (CAMath::Abs(tracklets[mHypothesis[iUpdate + hypothesisIdxOffset].mTrackletId].GetZbin() - tracklets[trkltIdx].GetZbin()) == 1 &&
+            CAMath::Abs(tracklets[mHypothesis[iUpdate + hypothesisIdxOffset].mTrackletId].GetY() - tracklets[trkltIdx].GetY()) < 1) {
           trkWork->setIsCrossingNeighbor(iLayer);
           trkWork->setHasNeighbor();
           break;
diff --git a/GPU/GPUTracking/display/render/GPUDisplayDraw.cxx b/GPU/GPUTracking/display/render/GPUDisplayDraw.cxx
@@ -64,7 +64,7 @@ inline void GPUDisplay::drawPointLinestrip(int32_t iSector, int32_t cid, int32_t
   mVertexBuffer[iSector].emplace_back(mGlobalPos[cid].x, mGlobalPos[cid].y * mYFactor, mCfgH.projectXY ? 0 : mGlobalPos[cid].z);
   float curVal;
   while ((curVal = mGlobalPos[cid].w) < id_limit) {
-    if (GPUCommonMath::AtomicCAS(&mGlobalPos[cid].w, curVal, (float)id)) {
+    if (CAMath::AtomicCAS(&mGlobalPos[cid].w, curVal, (float)id)) {
       break;
     }
     curVal = mGlobalPos[cid].w;

Original file line number	Diff line number	Diff line change
`@@ -64,7 +64,7 @@ inline void GPUDisplay::drawPointLinestrip(int32_t iSector, int32_t cid, int32_t`
`64`	`64`	`mVertexBuffer[iSector].emplace_back(mGlobalPos[cid].x, mGlobalPos[cid].y * mYFactor, mCfgH.projectXY ? 0 : mGlobalPos[cid].z);`
`65`	`65`	`float curVal;`
`66`	`66`	`while ((curVal = mGlobalPos[cid].w) < id_limit) {`
`67`		`- if (GPUCommonMath::AtomicCAS(&mGlobalPos[cid].w, curVal, (float)id)) {`
	`67`	`+ if (CAMath::AtomicCAS(&mGlobalPos[cid].w, curVal, (float)id)) {`
`68`	`68`	`break;`
`69`	`69`	`}`
`70`	`70`	`curVal = mGlobalPos[cid].w;`