Integer-Ctrl
diff --git a/‎.github/workflows/ci.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/ci.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎CMakeLists.txt‎
Lines changed: 2 additions & 3 deletions b/‎CMakeLists.txt‎
Lines changed: 2 additions & 3 deletions
diff --git a/‎src/main/kernels/matmul_16mRest_4nRest_k.cpp‎
Lines changed: 9 additions & 7 deletions b/‎src/main/kernels/matmul_16mRest_4nRest_k.cpp‎
Lines changed: 9 additions & 7 deletions
diff --git a/‎src/test/BaseGeneration.test.h‎
Lines changed: 1 addition & 0 deletions b/‎src/test/BaseGeneration.test.h‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎src/test/kernels/matmul.test.cpp‎
Lines changed: 114 additions & 0 deletions b/‎src/test/kernels/matmul.test.cpp‎
Lines changed: 114 additions & 0 deletions
diff --git a/‎src/test/kernels/matmul.test.h‎
Lines changed: 63 additions & 54 deletions b/‎src/test/kernels/matmul.test.h‎
Lines changed: 63 additions & 54 deletions
diff --git a/‎src/test/kernels/matmul_16_6_1.test.cpp‎
Lines changed: 2 additions & 2 deletions b/‎src/test/kernels/matmul_16_6_1.test.cpp‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎src/test/kernels/matmul_16_6_k.test.cpp‎
Lines changed: 4 additions & 4 deletions b/‎src/test/kernels/matmul_16_6_k.test.cpp‎
Lines changed: 4 additions & 4 deletions
@@ -59,5 +59,5 @@ jobs:
         ctest -j ${{env.parallel_processes}} -T memcheck -C ${{matrix.build_type}} --test-dir submission_25_05_01 --output-on-failure
         ctest -j ${{env.parallel_processes}} -T memcheck -C ${{matrix.build_type}} --test-dir submission_25_05_08 --output-on-failure
         ctest -j ${{env.parallel_processes}} -T memcheck -C ${{matrix.build_type}} --test-dir submission_25_05_15 --output-on-failure
-        ctest -j ${{env.parallel_processes}} -T memcheck -C ${{matrix.build_type}} --output-on-failure
+        ctest -j ${{env.parallel_processes}} -T memcheck -C ${{matrix.build_type}} --output-on-failure -E "^Test gemm generation"
 
@@ -121,13 +121,12 @@ set(TEST_FILES
 
 set(TEST_KERNELS
     matmul.test.h
+    matmul.test.cpp
     matmul_16_6_1.test.cpp
     matmul_16_6_k.test.cpp
     matmul_16m_4n_k.test.cpp
     matmul_16m_lt4nRest_k.test.cpp
-    matmul_16mRest_4nRest_k.n1.test.cpp
-    matmul_16mRest_4nRest_k.n2.test.cpp
-    matmul_16mRest_4nRest_k.n3.test.cpp
+    matmul_16mRest_4nRest_k.test.cpp
 )
 
 set(TEST_ARM_INSTRUCTION_FILES
 
@@ -19,13 +19,15 @@ void mini_jit::kernels::matmul_16mRest_4nRest_k(mini_jit::Kernel &kernel, const
   release_assert(n_loop_rest <= 3, "Cannot create a matrix with a rest of n larger than 3!");
 
   // Idea: Division of the matrix into sub-matrices and calculated in the following order.
-  // =====================================================
-  // |                        |                          |
-  // |                        | 2. matmul_16m_lt4nRest_k |
-  // | 1. matmul_16mRest_4n_k |                          |
-  // |                        |--------------------------|
-  // |                        | 3. Rest of m and n       |
-  // =====================================================
+  //                       N dimension
+  // ←---------------------------------------------------→
+  // ===================================================== ↑
+  // |                        |                          | |
+  // |                        | 2. matmul_16m_lt4nRest_k | |
+  // | 1. matmul_16mRest_4n_k |                          | | M dimension
+  // |                        |--------------------------| |
+  // |                        | 3. Rest of m and n       | |
+  // ===================================================== ↓
 
   kernel.add({
     // /**
 
@@ -59,6 +59,7 @@ class GenerationTest
   void verify_matmul(const float *__restrict__ expected, const float *__restrict__ result, uint32_t size);
 
 public:
+  GenerationTest() = delete;
   GenerationTest(uint32_t M, uint32_t N, uint32_t K);
   GenerationTest(uint32_t M, uint32_t N, uint32_t K, uint32_t BatchSize);
   ~GenerationTest();
 
@@ -0,0 +1,114 @@
+#include "matmul.test.h"
+/**
+ * @brief Runs the generated kernel and the naive reference matmul on the fixture matrices and compares both results.
+ *
+ * The generated kernel writes to matrix_c, the naive reference writes to matrix_c_verify.
+ *
+ * @param lda The leading dimension of matrix a.
+ * @param ldb The leading dimension of matrix b.
+ * @param ldc The leading dimension of matrix c.
+ * @param batch_stride_a The stride between two a matrices.
+ * @param batch_stride_b The stride between two b matrices.
+ */
+void GemmMxNxKxBatchTestFixture::_RunTest(const uint32_t lda, const uint32_t ldb, const uint32_t ldc, const uint32_t batch_stride_a,
+                                          const uint32_t batch_stride_b)
+{
+  // The INFO message is only registered when the kernel is empty, so it accompanies exactly the failing REQUIRE below.
+  if (native_kernel.get_size() <= 0)
+  {
+    INFO("The kernel should contain instructions before the test is executed.");
+    REQUIRE(native_kernel.get_size() > 0);
+  }
+
+  // Generate executable kernel
+  native_kernel.set_kernel();
+  mini_jit::Brgemm::kernel_t kernel = reinterpret_cast<mini_jit::Brgemm::kernel_t>(
+    const_cast<void *>(native_kernel.get_kernel()));  // Properly cast from const void* to kernel_t
+
+  // Run matmuls: generated kernel on matrix_c, naive reference on matrix_c_verify
+  kernel(matrix_a, matrix_b, matrix_c, lda, ldb, ldc, batch_stride_a, batch_stride_b);
+  naive_matmul_M_N_K_Batch(matrix_a, matrix_b, matrix_c_verify, lda, ldb, ldc, batch_stride_a, batch_stride_b);
+
+  // The first M * N elements of both result buffers are compared.
+  verify_matmul(matrix_c_verify, matrix_c, M * N);
+}
+
+/**
+ * @brief Fills the given matrix with random values.
+ *
+ * Every value is the quotient of two std::rand() draws, where the divisor is shifted by one so that it is never zero.
+ *
+ * @param matrix The matrix to fill.
+ * @param size The total size of the matrix.
+ */
+void GemmMxNxKxBatchTestFixture::fill_random_matrix(float *matrix, uint32_t size)
+{
+  // Seed only once: re-seeding with the current second on every call would restart the same pseudo-random
+  // sequence for every matrix that is filled within that second.
+  static const bool is_seeded = []
+  {
+    std::srand(static_cast<unsigned int>(std::time(nullptr)));
+    return true;
+  }();
+  static_cast<void>(is_seeded);
+
+  for (size_t i = 0; i < size; i++)
+  {
+    // The + 1 keeps the divisor non-zero, so neither inf nor NaN (0 / 0) can end up in the matrix.
+    const float dividend = static_cast<float>(std::rand());
+    const float divisor = static_cast<float>(std::rand()) + 1.0f;
+    matrix[i] = dividend / divisor;
+  }
+}
+
+/**
+ * @brief Writes the sequence 0, 1, 2, ... into the given matrix, one value per element.
+ *
+ * @param matrix The matrix to fill.
+ * @param size The total size of the matrix.
+ */
+void GemmMxNxKxBatchTestFixture::fill_counting_matrix(float *matrix, uint32_t size)
+{
+  for (uint32_t position = 0; position < size; ++position)
+  {
+    // Each element stores its own linear index converted to float.
+    matrix[position] = static_cast<float>(position);
+  }
+}
+
+/**
+ * @brief Reference matmul that adds the products of all batches of a and b onto c.
+ *
+ * Element (m, n) of c is addressed as c[m + n * ldc]; the operands are addressed as
+ * a[m + k * lda + batch * batch_stride_a] and b[k + n * ldb + batch * batch_stride_b].
+ * c is not cleared beforehand, the products are accumulated onto its current content.
+ *
+ * @param a The a matrix.
+ * @param b The b matrix.
+ * @param c The c matrix.
+ * @param lda The leading dimension of matrix a.
+ * @param ldb The leading dimension of matrix b.
+ * @param ldc The leading dimension of matrix c.
+ * @param batch_stride_a The batch stride of matrix a.
+ * @param batch_stride_b The batch stride of matrix b.
+ */
+void GemmMxNxKxBatchTestFixture::naive_matmul_M_N_K_Batch(const float *__restrict__ a, const float *__restrict__ b, float *__restrict__ c,
+                                                          int64_t lda, int64_t ldb, int64_t ldc, int64_t batch_stride_a,
+                                                          int64_t batch_stride_b)
+{
+  for (size_t batch = 0; batch < BatchSize; ++batch)
+  {
+    for (size_t row = 0; row < M; ++row)
+    {
+      for (size_t col = 0; col < N; ++col)
+      {
+        // The target element stays the same for the whole reduction over K.
+        const auto c_index = row + col * ldc;
+        for (size_t depth = 0; depth < K; ++depth)
+        {
+          const auto a_index = row + depth * lda + batch * batch_stride_a;
+          const auto b_index = depth + col * ldb + batch * batch_stride_b;
+          c[c_index] += a[a_index] * b[b_index];
+        }
+      }
+    }
+  }
+}
+
+/**
+ * @brief Compares the two matrices element by element and fails the test on the first mismatch.
+ *
+ * @param expected The matrix results that are expected.
+ * @param result The actual matrix values.
+ * @param size The total size of the matrix.
+ */
+void GemmMxNxKxBatchTestFixture::verify_matmul(const float *__restrict__ expected, const float *__restrict__ result, uint32_t size)
+{
+  for (size_t i = 0; i < size; i++)
+  {
+    // CAPTURE attaches the index and both values to the report of a failing assertion in this scope.
+    CAPTURE(i, result[i], expected[i]);
+    // Relative floating point comparison with the default tolerance of the matcher.
+    REQUIRE_THAT(result[i], Catch::Matchers::WithinRel(expected[i]));
+  }
+}
+
+/**
+ * @brief Stores the problem dimensions and allocates the matrices a, b, c and the verification copy of c.
+ *
+ * The matrices are left uninitialized; SetUp fills them.
+ *
+ * @param M The m dimension of the matmul.
+ * @param N The n dimension of the matmul.
+ * @param K The k dimension of the matmul.
+ * @param BatchSize The number of a and b matrices.
+ */
+GemmMxNxKxBatchTestFixture::GemmMxNxKxBatchTestFixture(uint32_t M, uint32_t N, uint32_t K, uint32_t BatchSize)
+    : M(M), N(N), K(K), BatchSize(BatchSize)
+{
+  // a and b hold one matrix per batch entry, c and its verification copy hold a single M x N matrix.
+  const uint32_t elements_a = M * K * BatchSize;
+  const uint32_t elements_b = K * N * BatchSize;
+  const uint32_t elements_c = M * N;
+
+  matrix_a = new float[elements_a];
+  matrix_b = new float[elements_b];
+  matrix_c = new float[elements_c];
+  matrix_c_verify = new float[elements_c];
+}
+
+/**
+ * @brief Releases the four matrices that were allocated by the constructor.
+ */
+GemmMxNxKxBatchTestFixture::~GemmMxNxKxBatchTestFixture()
+{
+  // Same release order as the allocation order: a, b, c, c_verify.
+  float *const owned_matrices[] = {matrix_a, matrix_b, matrix_c, matrix_c_verify};
+  for (float *owned_matrix : owned_matrices)
+  {
+    delete[] owned_matrix;
+  }
+}
+
+/**
+ * @brief Fills the matrices a, b and c with the requested infill and copies c into the verification matrix.
+ *
+ * @param fillType Fills the matrices with the given infill type; any other value fails the test.
+ */
+void GemmMxNxKxBatchTestFixture::SetUp(TestInfill fillType)
+{
+  const uint32_t elements_a = M * K * BatchSize;
+  const uint32_t elements_b = K * N * BatchSize;
+  const uint32_t elements_c = M * N;
+
+  if (fillType == TestInfill::Random)
+  {
+    fill_random_matrix(matrix_a, elements_a);
+    fill_random_matrix(matrix_b, elements_b);
+    fill_random_matrix(matrix_c, elements_c);
+  }
+  else if (fillType == TestInfill::Counting)
+  {
+    fill_counting_matrix(matrix_a, elements_a);
+    fill_counting_matrix(matrix_b, elements_b);
+    fill_counting_matrix(matrix_c, elements_c);
+  }
+  else
+  {
+    FAIL("Undefined infill type found.");
+  }
+
+  // Both the kernel and the reference matmul accumulate onto c, so they have to start from the same content.
+  std::copy(matrix_c, matrix_c + elements_c, matrix_c_verify);
+}
+
+/**
+ * @brief Creates a fixture for a single matmul by constructing the batch fixture with a batch size of 1.
+ *
+ * @param M The m dimension of the matmul.
+ * @param N The n dimension of the matmul.
+ * @param K The k dimension of the matmul.
+ */
+GemmMxNxKTestFixture::GemmMxNxKTestFixture(uint32_t M, uint32_t N, uint32_t K)
+    : GemmMxNxKxBatchTestFixture(M, N, K, /*BatchSize=*/1)
+{
+}
+
+/**
+ * @brief Nothing to release here; the matrices are freed by the destructor of the batch fixture.
+ */
+GemmMxNxKTestFixture::~GemmMxNxKTestFixture() = default;
@@ -108,46 +108,71 @@ enum class TestInfill
   Counting,
 };
 
-template <uint32_t TMdim, uint32_t TNdim, uint32_t TKdim, uint32_t TBatchDim> class GemmMxNxKxBatchTestFixture
+class GemmMxNxKxBatchTestFixture
 {
+private:
+  uint32_t M;
+  uint32_t N;
+  uint32_t K;
+  uint32_t BatchSize;
+  float *matrix_a;
+  float *matrix_b;
+  float *matrix_c;
+  float *matrix_c_verify;
+
+  /**
+   * @brief Fills the given matrix with random values.
+   *
+   * @param matrix The matrix to fill.
+   * @param size The total size of the matrix.
+   */
+  void fill_random_matrix(float *matrix, uint32_t size);
+
+  /**
+   * @brief Fills the given matrix with counting values starting from 0.
+   *
+   * @param matrix The matrix to fill.
+   * @param size The total size of the matrix.
+   */
+  void fill_counting_matrix(float *matrix, uint32_t size);
+
+  /**
+   * @brief Computes a naive batched matmul that accumulates onto c; its result is the reference for verification.
+   *
+   * @param a The a matrix.
+   * @param b The b matrix.
+   * @param c The c matrix.
+   * @param lda The leading dimension of matrix a.
+   * @param ldb The leading dimension of matrix b.
+   * @param ldc The leading dimension of matrix c.
+   * @param batch_stride_a The batch stride of matrix a.
+   * @param batch_stride_b The batch stride of matrix b.
+   */
+  void naive_matmul_M_N_K_Batch(const float *__restrict__ a, const float *__restrict__ b, float *__restrict__ c, int64_t lda, int64_t ldb,
+                                int64_t ldc, int64_t batch_stride_a, int64_t batch_stride_b);
+
+  /**
+   * @brief Compares the two matrices element by element.
+   *
+   * @param expected The matrix results that are expected.
+   * @param result The actual matrix values.
+   * @param size The total size of the matrix.
+   */
+  void verify_matmul(const float *__restrict__ expected, const float *__restrict__ result, uint32_t size);
+
 public:
-  float matrix_a[TMdim * TKdim * TBatchDim];
-  float matrix_b[TKdim * TNdim * TBatchDim];
-  float matrix_c[TMdim * TNdim];
-  float matrix_c_verify[TMdim * TNdim];
-  const uint32_t lda = TMdim;
-  const uint32_t ldb = TKdim;
-  const uint32_t ldc = TMdim;
-  const uint32_t batch_stride_a = TMdim * TKdim;
-  const uint32_t batch_stride_b = TKdim * TNdim;
   mini_jit::Kernel native_kernel;
 
+  GemmMxNxKxBatchTestFixture() = delete;
+  GemmMxNxKxBatchTestFixture(uint32_t M, uint32_t N, uint32_t K, uint32_t BatchSize);
+  ~GemmMxNxKxBatchTestFixture();
+
   /**
    * @brief Set up the test fixture object.
    *
    * @param fillType Fills the matrices with the given infill type.
    */
-  void SetUp(TestInfill fillType)
-  {
-    switch (fillType)
-    {
-    case TestInfill::Random:
-      fill_random_matrix(matrix_a);
-      fill_random_matrix(matrix_b);
-      fill_random_matrix(matrix_c);
-      break;
-    case TestInfill::Counting:
-      fill_counting_matrix(matrix_a);
-      fill_counting_matrix(matrix_b);
-      fill_counting_matrix(matrix_c);
-      break;
-    default:
-      FAIL("Undefined infill type found.");
-      break;
-    }
-
-    copy_matrix(matrix_c, matrix_c_verify);
-  }
+  void SetUp(TestInfill fillType);
 
   /**
    * @brief Executes the Test von an BRGemm with the given input.
@@ -173,36 +198,20 @@ template <uint32_t TMdim, uint32_t TNdim, uint32_t TKdim, uint32_t TBatchDim> cl
    * @param br_stride_a: stride between two A matrices (in elements, not bytes).
    * @param br_stride_b: stride between two B matrices (in elements, not bytes).
    */
-  void _RunTest(const uint32_t lda, const uint32_t ldb, const uint32_t ldc, const uint32_t batch_stride_a, const uint32_t batch_stride_b)
-  {
-    if (native_kernel.get_size() <= 0)
-    {
-      INFO("The kernel should contain instructions before the test is executed.");
-      REQUIRE(native_kernel.get_size() > 0);
-    }
-
-    // Generate executable kernel
-    native_kernel.set_kernel();
-    mini_jit::Brgemm::kernel_t kernel = reinterpret_cast<mini_jit::Brgemm::kernel_t>(
-      const_cast<void *>(native_kernel.get_kernel()));  // Properly cast from const void* to kernel_t
-
-    // Run matmuls
-    kernel(matrix_a, matrix_b, matrix_c, lda, ldb, ldc, batch_stride_a, batch_stride_b);
-    naive_matmul_M_N_K_Batch<TMdim, TNdim, TKdim, TBatchDim>(matrix_a, matrix_b, matrix_c_verify, lda, ldb, ldc, batch_stride_a,
-                                                             batch_stride_b);
-
-    verify_matmul(matrix_c_verify, matrix_c);
-  }
+  void _RunTest(const uint32_t lda, const uint32_t ldb, const uint32_t ldc, const uint32_t batch_stride_a, const uint32_t batch_stride_b);
 };
 
-template <uint32_t TMdim, uint32_t TNdim, uint32_t TKdim>
-class GemmMxNxKTestFixture : public GemmMxNxKxBatchTestFixture<TMdim, TNdim, TKdim, 1>
+class GemmMxNxKTestFixture : public GemmMxNxKxBatchTestFixture
 {
 
   void RunTest(const uint32_t lda, const uint32_t ldb, const uint32_t ldc, const uint32_t batch_stride_a,
                const uint32_t batch_stride_b) = delete;  // delete so not visible in a GemmMxNxKTestFixture object.
 
 public:
+  GemmMxNxKTestFixture() = delete;
+  GemmMxNxKTestFixture(uint32_t M, uint32_t N, uint32_t K);
+  ~GemmMxNxKTestFixture();
+
   /**
    * @brief Executes the Test von an BRGemm with the given input.
    *
@@ -212,7 +221,7 @@ class GemmMxNxKTestFixture : public GemmMxNxKxBatchTestFixture<TMdim, TNdim, TKd
    */
   void RunTest(const uint32_t lda, const uint32_t ldb, const uint32_t ldc)
   {
-    GemmMxNxKxBatchTestFixture<TMdim, TNdim, TKdim, 1>::_RunTest(lda, ldb, ldc, 0, 0);
+    GemmMxNxKxBatchTestFixture::_RunTest(lda, ldb, ldc, 0, 0);
   }
 };
 
 
@@ -5,15 +5,15 @@
 
 TEST_CASE("Test matmul_16_6_1 jited gemm correctness random data", "[jit][correctness][gemm]")
 {
-  GemmMxNxKTestFixture<16, 6, 1> gemmTest;
+  GemmMxNxKTestFixture gemmTest(16, 6, 1);
   gemmTest.SetUp(TestInfill::Random);
   mini_jit::kernels::matmul_16_6_1(gemmTest.native_kernel);
   gemmTest.RunTest(16, 1, 16);
 }
 
 TEST_CASE("Test matmul_16_6_1 jited gemm correctness counting data", "[jit][correctness][gemm]")
 {
-  GemmMxNxKTestFixture<16, 6, 1> gemmTest;
+  GemmMxNxKTestFixture gemmTest(16, 6, 1);
   gemmTest.SetUp(TestInfill::Counting);
   mini_jit::kernels::matmul_16_6_1(gemmTest.native_kernel);
   gemmTest.RunTest(16, 1, 16);
 
@@ -5,31 +5,31 @@
 
 TEST_CASE("Test matmul_16_6_k (M=16, N=6, K=1) jited gemm correctness random data", "[jit][correctness][gemm]")
 {
-  GemmMxNxKTestFixture<16, 6, 1> gemmTest;
+  GemmMxNxKTestFixture gemmTest(16, 6, 1);
   gemmTest.SetUp(TestInfill::Random);
   mini_jit::kernels::matmul_16_6_k(gemmTest.native_kernel, 1);
   gemmTest.RunTest(16, 1, 16);
 }
 
 TEST_CASE("Test matmul_16_6_k (M=16, N=6, K=1) jited gemm correctness counting data", "[jit][correctness][gemm]")
 {
-  GemmMxNxKTestFixture<16, 6, 1> gemmTest;
+  GemmMxNxKTestFixture gemmTest(16, 6, 1);
   gemmTest.SetUp(TestInfill::Counting);
   mini_jit::kernels::matmul_16_6_k(gemmTest.native_kernel, 1);
   gemmTest.RunTest(16, 1, 16);
 }
 
 TEST_CASE("Test matmul_16_6_k (M=16, N=6, K=128) jited gemm correctness random data", "[jit][correctness][gemm]")
 {
-  GemmMxNxKTestFixture<16, 6, 128> gemmTest;
+  GemmMxNxKTestFixture gemmTest(16, 6, 128);
   gemmTest.SetUp(TestInfill::Random);
   mini_jit::kernels::matmul_16_6_k(gemmTest.native_kernel, 128);
   gemmTest.RunTest(16, 128, 16);
 }
 
 TEST_CASE("Test matmul_16_6_k (M=16, N=6, K=128) jited gemm correctness counting data", "[jit][correctness][gemm]")
 {
-  GemmMxNxKTestFixture<16, 6, 128> gemmTest;
+  GemmMxNxKTestFixture gemmTest(16, 6, 128);
   gemmTest.SetUp(TestInfill::Counting);
   mini_jit::kernels::matmul_16_6_k(gemmTest.native_kernel, 128);
   gemmTest.RunTest(16, 128, 16);
Original file line number	Diff line number	Diff line change
`@@ -5,15 +5,15 @@`
`5`	`5`
`6`	`6`	`TEST_CASE("Test matmul_16_6_1 jited gemm correctness random data", "[jit][correctness][gemm]")`
`7`	`7`	`{`
`8`		`- GemmMxNxKTestFixture<16, 6, 1> gemmTest;`
	`8`	`+ GemmMxNxKTestFixture gemmTest(16, 6, 1);`
`9`	`9`	`gemmTest.SetUp(TestInfill::Random);`
`10`	`10`	`mini_jit::kernels::matmul_16_6_1(gemmTest.native_kernel);`
`11`	`11`	`gemmTest.RunTest(16, 1, 16);`
`12`	`12`	`}`
`13`	`13`
`14`	`14`	`TEST_CASE("Test matmul_16_6_1 jited gemm correctness counting data", "[jit][correctness][gemm]")`
`15`	`15`	`{`
`16`		`- GemmMxNxKTestFixture<16, 6, 1> gemmTest;`
	`16`	`+ GemmMxNxKTestFixture gemmTest(16, 6, 1);`
`17`	`17`	`gemmTest.SetUp(TestInfill::Counting);`
`18`	`18`	`mini_jit::kernels::matmul_16_6_1(gemmTest.native_kernel);`
`19`	`19`	`gemmTest.RunTest(16, 1, 16);`
Original file line number	Diff line number	Diff line change
`@@ -5,31 +5,31 @@`
`5`	`5`
`6`	`6`	`TEST_CASE("Test matmul_16_6_k (M=16, N=6, K=1) jited gemm correctness random data", "[jit][correctness][gemm]")`
`7`	`7`	`{`
`8`		`- GemmMxNxKTestFixture<16, 6, 1> gemmTest;`
	`8`	`+ GemmMxNxKTestFixture gemmTest(16, 6, 1);`
`9`	`9`	`gemmTest.SetUp(TestInfill::Random);`
`10`	`10`	`mini_jit::kernels::matmul_16_6_k(gemmTest.native_kernel, 1);`
`11`	`11`	`gemmTest.RunTest(16, 1, 16);`
`12`	`12`	`}`
`13`	`13`
`14`	`14`	`TEST_CASE("Test matmul_16_6_k (M=16, N=6, K=1) jited gemm correctness counting data", "[jit][correctness][gemm]")`
`15`	`15`	`{`
`16`		`- GemmMxNxKTestFixture<16, 6, 1> gemmTest;`
	`16`	`+ GemmMxNxKTestFixture gemmTest(16, 6, 1);`
`17`	`17`	`gemmTest.SetUp(TestInfill::Counting);`
`18`	`18`	`mini_jit::kernels::matmul_16_6_k(gemmTest.native_kernel, 1);`
`19`	`19`	`gemmTest.RunTest(16, 1, 16);`
`20`	`20`	`}`
`21`	`21`
`22`	`22`	`TEST_CASE("Test matmul_16_6_k (M=16, N=6, K=128) jited gemm correctness random data", "[jit][correctness][gemm]")`
`23`	`23`	`{`
`24`		`- GemmMxNxKTestFixture<16, 6, 128> gemmTest;`
	`24`	`+ GemmMxNxKTestFixture gemmTest(16, 6, 128);`
`25`	`25`	`gemmTest.SetUp(TestInfill::Random);`
`26`	`26`	`mini_jit::kernels::matmul_16_6_k(gemmTest.native_kernel, 128);`
`27`	`27`	`gemmTest.RunTest(16, 128, 16);`
`28`	`28`	`}`
`29`	`29`
`30`	`30`	`TEST_CASE("Test matmul_16_6_k (M=16, N=6, K=128) jited gemm correctness counting data", "[jit][correctness][gemm]")`
`31`	`31`	`{`
`32`		`- GemmMxNxKTestFixture<16, 6, 128> gemmTest;`
	`32`	`+ GemmMxNxKTestFixture gemmTest(16, 6, 128);`
`33`	`33`	`gemmTest.SetUp(TestInfill::Counting);`
`34`	`34`	`mini_jit::kernels::matmul_16_6_k(gemmTest.native_kernel, 128);`
`35`	`35`	`gemmTest.RunTest(16, 128, 16);`