AliceO2Group
diff --git a/‎Detectors/TPC/calibration/include/TPCCalibration/TPCFastSpaceChargeCorrectionHelper.h‎
Lines changed: 9 additions & 1 deletion b/‎Detectors/TPC/calibration/include/TPCCalibration/TPCFastSpaceChargeCorrectionHelper.h‎
Lines changed: 9 additions & 1 deletion
diff --git a/‎Detectors/TPC/calibration/src/TPCFastSpaceChargeCorrectionHelper.cxx‎
Lines changed: 107 additions & 56 deletions b/‎Detectors/TPC/calibration/src/TPCFastSpaceChargeCorrectionHelper.cxx‎
Lines changed: 107 additions & 56 deletions
diff --git a/‎GPU/TPCFastTransformation/Spline1DSpec.h‎
Lines changed: 39 additions & 49 deletions b/‎GPU/TPCFastTransformation/Spline1DSpec.h‎
Lines changed: 39 additions & 49 deletions
@@ -102,7 +102,15 @@ class TPCFastSpaceChargeCorrectionHelper
   /// initialise inverse transformation from linear combination of several input corrections
   void initInverse(std::vector<o2::gpu::TPCFastSpaceChargeCorrection*>& corrections, const std::vector<float>& scaling, bool prn);
 
-  void MergeCorrections(std::vector<o2::gpu::TPCFastSpaceChargeCorrection*>& corrections, const std::vector<float>& scaling, bool prn);
+  /// merge several corrections
+  /// \param mainCorrection main correction
+  /// \param scale scaling factor for the main correction
+  /// \param additionalCorrections vector of pairs of additional corrections and their scaling factors
+  /// \param prn printout flag
+  /// \return main correction merged with additional corrections
+  void MergeCorrections(
+    o2::gpu::TPCFastSpaceChargeCorrection& mainCorrection, float scale,
+    const std::vector<std::pair<const o2::gpu::TPCFastSpaceChargeCorrection*, float>>& additionalCorrections, bool prn);
 
  private:
   /// geometry initialization
 
@@ -176,8 +176,8 @@ void TPCFastSpaceChargeCorrectionHelper::fillSpaceChargeCorrectionFromMap(TPCFas
         }
 
         if (processingInverseCorrection) {
-          float* splineX = correction.getSplineData(sector, row, 1);
-          float* splineYZ = correction.getSplineData(sector, row, 2);
+          float* splineX = correction.getSplineDataInvX(sector, row);
+          float* splineYZ = correction.getSplineDataInvYZ(sector, row);
           for (int i = 0; i < spline.getNumberOfParameters() / 3; i++) {
             splineX[i] = splineParameters[3 * i + 0];
             splineYZ[2 * i + 0] = splineParameters[3 * i + 1];
@@ -940,8 +940,8 @@ void TPCFastSpaceChargeCorrectionHelper::initInverse(std::vector<o2::gpu::TPCFas
                                      dataPointGridU.data(), dataPointGridV.data(),
                                      dataPointF.data(), nDataPoints);
 
-        float* splineX = correction.getSplineData(sector, row, 1);
-        float* splineUV = correction.getSplineData(sector, row, 2);
+        float* splineX = correction.getSplineDataInvX(sector, row);
+        float* splineUV = correction.getSplineDataInvYZ(sector, row);
         for (int i = 0; i < spline.getNumberOfParameters() / 3; i++) {
           splineX[i] = splineParameters[3 * i + 0];
           splineUV[2 * i + 0] = splineParameters[3 * i + 1];
@@ -967,77 +967,129 @@ void TPCFastSpaceChargeCorrectionHelper::initInverse(std::vector<o2::gpu::TPCFas
   LOGP(info, "Inverse tooks: {}s", duration);
 }
 
-void TPCFastSpaceChargeCorrectionHelper::MergeCorrections(std::vector<o2::gpu::TPCFastSpaceChargeCorrection*>& corrections, const std::vector<float>& scaling, bool prn)
+void TPCFastSpaceChargeCorrectionHelper::MergeCorrections(
+  o2::gpu::TPCFastSpaceChargeCorrection& mainCorrection, float mainScale,
+  const std::vector<std::pair<const o2::gpu::TPCFastSpaceChargeCorrection*, float>>& additionalCorrections, bool /*prn*/)
 {
   /// merge several corrections
-  /*
+
   TStopwatch watch;
   LOG(info) << "fast space charge correction helper: Merge corrections";
 
-  if (corrections.size() != scaling.size()) {
-    LOGP(error, "Input corrections and scaling values have different size");
-    return;
-  }
-
-  auto& correction = *(corrections.front());
+  const auto& geo = mainCorrection.getGeometry();
 
-  for (int sector = 0; sector < mGeo.getNumberOfSectors(); sector++) {
+  for (int sector = 0; sector < geo.getNumberOfSectors(); sector++) {
 
     auto myThread = [&](int iThread) {
-      for (int row = iThread; row < mGeo.getNumberOfRows(); row += mNthreads) {
-        TPCFastSpaceChargeCorrection::SplineType spline = correction.getSpline(sector, row);
+      for (int row = iThread; row < geo.getNumberOfRows(); row += mNthreads) {
+        const auto& spline = mainCorrection.getSpline(sector, row);
 
-        std::vector<float> splineParameters(spline.getNumberOfParameters());
-        std::vector<float> splineParametersInvX(spline.getNumberOfParameters());
-        std::vector<float> splineParametersInvYZ(spline.getNumberOfParameters());
+        float* splineParameters = mainCorrection.getSplineData(sector, row);
+        float* splineParametersInvX = mainCorrection.getSplineDataInvX(sector, row);
+        float* splineParametersInvYZ = mainCorrection.getSplineDataInvYZ(sector, row);
 
-        const auto& gridU = spline.getGridX1();
-        const auto& gridV = spline.getGridX2();
-
-        for (int iu = 0; iu < gridU.getNumberOfKnots(); iu++) {
-          double u = gridU.getKnot(iu).u;
-          for (int iv = 0; iv < gridV.getNumberOfKnots(); iv++) {
-            int knotIndex = spline.getKnotIndex(iu, iv);
+        auto& secRowInfo = mainCorrection.getSectorRowInfo(sector, row);
 
-            double v = gridV.getKnot(iu).u;
-            auto [y, z] = correction.convGridToLocal(sector, row, u, v);
-            constexpr int nKnotPar1d = 4;
-            constexpr int nKnotPar2d = nKnotPar1d * 2;
-            constexpr int nKnotPar3d = nKnotPar1d * 3;
+        constexpr int nKnotPar1d = 4;
+        constexpr int nKnotPar2d = nKnotPar1d * 2;
+        constexpr int nKnotPar3d = nKnotPar1d * 3;
 
-            for (int i = 0; i < corrections.size(); ++i) {
-              double s = scaling[i];
-              auto p = corrections[i]->getCorrectionParameters(sector, row, y, z);
-              for (int j = 0; j < nKnotPar3d; ++j) {
-                splineParameters[knotIndex * nKnotPar3d + j] += s * p[j];
+        { // scale the main correction
+          for (int i = 0; i < 3; i++) {
+            secRowInfo.maxCorr[i] *= mainScale;
+            secRowInfo.minCorr[i] *= mainScale;
+          }
+          double parscale[4] = {mainScale, mainScale, mainScale, mainScale * mainScale};
+          for (int iknot = 0, ind = 0; iknot < spline.getNumberOfKnots(); iknot++) {
+            for (int ipar = 0; ipar < nKnotPar1d; ++ipar) {
+              for (int idim = 0; idim < 3; idim++, ind++) {
+                splineParameters[ind] *= parscale[ipar];
               }
-              auto pInvX = corrections[i]->getCorrectionParametersInvX(sector, row, y, z);
-              for (int j = 0; j < nKnotPar1d; ++j) {
-                splineParametersInvX[knotIndex * nKnotPar1d + j] += s * pInvX[j];
+            }
+          }
+          for (int iknot = 0, ind = 0; iknot < spline.getNumberOfKnots(); iknot++) {
+            for (int ipar = 0; ipar < nKnotPar1d; ++ipar) {
+              for (int idim = 0; idim < 1; idim++, ind++) {
+                splineParametersInvX[ind] *= parscale[ipar];
               }
-              auto pInvYZ = corrections[i]->getCorrectionParametersInvYZ(sector, row, y, z);
-              for (int j = 0; j < nKnotPar2d; ++j) {
-                splineParametersInvYZ[knotIndex * nKnotPar2d + j] += s * pInvYZ[j];
+            }
+          }
+          for (int iknot = 0, ind = 0; iknot < spline.getNumberOfKnots(); iknot++) {
+            for (int ipar = 0; ipar < nKnotPar1d; ++ipar) {
+              for (int idim = 0; idim < 2; idim++, ind++) {
+                splineParametersInvYZ[ind] *= parscale[ipar];
               }
             }
-          } // iv
-        }   // iu
+          }
+        }
 
-        float* splineXYZ = correction.getSplineData(sector, row, 0);
-        float* splineInvX = correction.getSplineData(sector, row, 1);
-        float* splineInvYZ = correction.getSplineData(sector, row, 2);
+        // add the other corrections
 
-        for (int i = 0; i < spline.getNumberOfParameters(); i++) {
-          splineXYZ[i] = splineParameters[i];
-        }
-        for (int i = 0; i < spline.getNumberOfParameters() / 3; i++) {
-          splineX[i] = splineParametersInvX[i];
-          splineYZ[2 * i + 0] = splineParametersInvYZ[2 * i + 0];
-          splineYZ[2 * i + 1] = splineParametersInvYZ[2 * i + 1];
-        }
+        const auto& gridU = spline.getGridX1();
+        const auto& gridV = spline.getGridX2();
+
+        for (int icorr = 0; icorr < additionalCorrections.size(); ++icorr) {
+          const auto& corr = *(additionalCorrections[icorr].first);
+          double scale = additionalCorrections[icorr].second;
+          auto& linfo = corr.getSectorRowInfo(sector, row);
+          secRowInfo.updateMaxValues(linfo.getMaxValues(), scale);
+          secRowInfo.updateMaxValues(linfo.getMinValues(), scale);
+
+          double scaleU = secRowInfo.scaleUtoGrid / linfo.scaleUtoGrid;
+          double scaleV = secRowInfo.scaleVtoGrid / linfo.scaleVtoGrid;
+
+          for (int iu = 0; iu < gridU.getNumberOfKnots(); iu++) {
+            double u = gridU.getKnot(iu).u;
+            for (int iv = 0; iv < gridV.getNumberOfKnots(); iv++) {
+              double v = gridV.getKnot(iu).u;
+              int knotIndex = spline.getKnotIndex(iu, iv);
+              float P[nKnotPar3d];
+
+              { // direct correction
+                auto [y, z] = mainCorrection.convGridToLocal(sector, row, u, v);
+                // return values: u, v, scaling factor
+                auto [lu, lv, ls] = corr.convLocalToGrid(sector, row, y, z);
+                ls *= scale;
+                double parscale[4] = {ls, ls * scaleU, ls * scaleV, ls * ls * scaleU * scaleV};
+                const auto& spl = corr.getSpline(sector, row);
+                spl.interpolateParametersAtU(corr.getSplineData(sector, row), lu, lv, P);
+                for (int ipar = 0, ind = 0; ipar < nKnotPar1d; ++ipar) {
+                  for (int idim = 0; idim < 3; idim++, ind++) {
+                    splineParameters[knotIndex * nKnotPar3d + ind] += parscale[ipar] * P[ind];
+                  }
+                }
+              }
+
+              auto [y, z] = mainCorrection.convGridToCorrectedLocal(sector, row, u, v);
+              // return values: u, v, scaling factor
+              auto [lu, lv, ls] = corr.convCorrectedLocalToGrid(sector, row, y, z);
+              ls *= scale;
+              double parscale[4] = {ls, ls * scaleU, ls * scaleV, ls * ls * scaleU * scaleV};
+
+              { // inverse X correction
+                corr.getSplineInvX(sector, row).interpolateParametersAtU(corr.getSplineDataInvX(sector, row), lu, lv, P);
+                for (int ipar = 0, ind = 0; ipar < nKnotPar1d; ++ipar) {
+                  for (int idim = 0; idim < 1; idim++, ind++) {
+                    splineParametersInvX[knotIndex * nKnotPar1d + ind] += parscale[ipar] * P[ind];
+                  }
+                }
+              }
+
+              { // inverse YZ correction
+                corr.getSplineInvYZ(sector, row).interpolateParametersAtU(corr.getSplineDataInvYZ(sector, row), lu, lv, P);
+                for (int ipar = 0, ind = 0; ipar < nKnotPar1d; ++ipar) {
+                  for (int idim = 0; idim < 2; idim++, ind++) {
+                    splineParametersInvYZ[knotIndex * nKnotPar2d + ind] += parscale[ipar] * P[ind];
+                  }
+                }
+              }
+
+            } // iv
+          } // iu
+        } // corrections
 
       } // row
-    };  // thread
+    }; // thread
 
     std::vector<std::thread> threads(mNthreads);
 
@@ -1054,7 +1106,6 @@ void TPCFastSpaceChargeCorrectionHelper::MergeCorrections(std::vector<o2::gpu::T
   } // sector
   float duration = watch.RealTime();
   LOGP(info, "Merge of corrections tooks: {}s", duration);
-  */
 }
 
 } // namespace tpc
 
@@ -318,7 +318,10 @@ class Spline1DSpec<DataT, YdimT, 0> : public Spline1DContainer<DataT>
     for (int32_t dim = 0; dim < nYdim; ++dim) {
       S[dim] = dSdSr * Sr[dim] + dSdSl * Sl[dim] + dSdDl * Dl[dim] + dSdDr * Dr[dim];
     }
+
     /*
+    another way to calculate f(u):
+
     if (u < (DataT)0) {
       u = (DataT)0;
     }
@@ -336,18 +339,6 @@ class Spline1DSpec<DataT, YdimT, 0> : public Spline1DContainer<DataT>
       S[dim] = ((a * v + b) * v + Dl[dim]) * uu + Sl[dim];
     }
     */
-    /*
-     another way to calculate f(u):
-     T uu = T(u - knotL.u);
-     T v = uu * T(knotL.Li); // scaled u
-     T vm1 = v-1;
-     T v2 = v * v;
-     float cSr = v2*(3-2*v);
-     float cSl = 1-cSr;
-     float cDl = v*vm1*vm1*knotL.L;
-     float cDr = v2*vm1*knotL.L;
-     return cSl*Sl + cSr*Sr + cDl*Dl + cDr*Dr;
-    */
   }
 
   template <typename T>
@@ -365,51 +356,50 @@ class Spline1DSpec<DataT, YdimT, 0> : public Spline1DContainer<DataT>
 
     u = u - knotL.u;
     T v = u * T(knotL.Li); // scaled u
-    T vm1 = v - 1.;
+    T vm1 = v - T(1.);
     T a = u * vm1;
     T v2 = v * v;
-    T dSdSr = v2 * (3. - 2 * v);
-    T dSdSl = 1. - dSdSr;
+    T dSdSr = v2 * (T(3.) - v - v);
+    T dSdSl = T(1.) - dSdSr;
     T dSdDl = vm1 * a;
     T dSdDr = v * a;
     // S(u) = dSdSl * Sl + dSdSr * Sr + dSdDl * Dl + dSdDr * Dr;
     return std::make_tuple(dSdSl, dSdDl, dSdSr, dSdDr);
   }
-  /*
-    template <typename T>
-    GPUd() void getUsecondDerivatives(const Knot& knotL, DataT u,
-                                      T& dSl, T& dDl, T& dSr, T& dDr,
-                                      T& dSl2, T& dDl2, T& dSr2, T& dDr2) const
-    {
-      /// Get derivatives of the interpolated value {S(u): 1D -> nYdim} at the segment [knotL, next knotR]
-      /// over the spline values Sl, Sr and the slopes Dl, Dr
-
-      if (u < (DataT)0) {
-        u = (DataT)0;
-      }
-      if (u > (DataT)TBase::getUmax()) {
-        u = (DataT)TBase::getUmax();
-      }
-
-      u = u - knotL.u;
-      T v = u * T(knotL.Li); // scaled u
-      T vm1 = v - 1.;
-      T a = u * vm1;
-      T v2 = v * v;
-      dSr = v2 * (3. - 2 * v);
-      dSl = 1. - dSr;
-      dDl = vm1 * a;
-      dDr = v * a;
-      T dv = T(knotL.Li);
-      dSr2 = 6. * v * (1. - v) * dv;
-      dSl2 = -dSr2;
-      dDl2 = (v - 1) * (3 * v - 1);
-      dDr = u * (v * v - v);
-      dDr2 = 3.f * v * v - 2.f * v;
-      // F(u) = dSl * Sl + dSr * Sr + dDl * Dl + dDr * Dr;
-      // dF(u)/du = dSl2 * Sl + dSr2 * Sr + dDl2 * Dl + dDr2 * Dr;
+
+  template <typename T>
+  GPUd() std::tuple<T, T, T, T, T, T, T, T> getSDderivativesOverParsAtU(const Knot& knotL, DataT u) const
+  {
+    /// Get derivatives of the interpolated value {S(u): 1D -> nYdim} at the segment [knotL, next knotR]
+    /// over the spline values Sl, Sr and the slopes Dl, Dr
+
+    if (u < (DataT)0) {
+      u = (DataT)0;
     }
-  */
+    if (u > (DataT)TBase::getUmax()) {
+      u = (DataT)TBase::getUmax();
+    }
+
+    u = u - knotL.u;
+    T v = u * T(knotL.Li); // scaled u
+    T vm1 = v - T(1.);
+    T a = u * vm1;
+    T v2 = v * v;
+    T dSdSr = v2 * (T(3.) - v - v);
+    T dSdSl = T(1.) - dSdSr;
+    T dSdDl = vm1 * a;
+    T dSdDr = v * a;
+
+    T dv = T(knotL.Li);
+    T dDdSr = 6. * v * (T(1.) - v) * dv;
+    T dDdSl = -dDdSr;
+    T dDdDl = vm1 * (v + v + vm1);
+    T dDdDr = v * (v + vm1 + vm1);
+    // S(u) = dSdSl * Sl + dSdSr * Sr + dSdDl * Dl + dSdDr * Dr;
+    // D(u) = dS(u)/du = dDdSl * Sl + dDdSr * Sr + dDdDl * Dl + dDdDr * Dr;
+    return std::make_tuple(dSdSl, dSdDl, dSdSr, dSdDr, dDdSl, dDdDl, dDdSr, dDdDr);
+  }
+
   using TBase::convXtoU;
   using TBase::getKnot;
   using TBase::getKnots;