intel
diff --git a/sycl/test-e2e/Matrix/SG32/joint_matrix_bf16_fill_k_cache.cpp b/sycl/test-e2e/Matrix/SG32/joint_matrix_bf16_fill_k_cache.cpp
Lines changed: 5 additions & 8 deletions
diff --git a/sycl/test-e2e/Matrix/SG32/joint_matrix_bf16_fill_k_cache_init.cpp b/sycl/test-e2e/Matrix/SG32/joint_matrix_bf16_fill_k_cache_init.cpp
Lines changed: 3 additions & 3 deletions
diff --git a/sycl/test-e2e/Matrix/SG32/joint_matrix_bf16_fill_k_cache_unroll.cpp b/sycl/test-e2e/Matrix/SG32/joint_matrix_bf16_fill_k_cache_unroll.cpp
Lines changed: 5 additions & 8 deletions
diff --git a/sycl/test-e2e/Matrix/SG32/joint_matrix_bf16_fill_k_cache_unroll_init.cpp b/sycl/test-e2e/Matrix/SG32/joint_matrix_bf16_fill_k_cache_unroll_init.cpp
Lines changed: 3 additions & 3 deletions
diff --git a/sycl/test-e2e/Matrix/XMX8/joint_matrix_bf16_fill_k_cache.cpp b/sycl/test-e2e/Matrix/XMX8/joint_matrix_bf16_fill_k_cache.cpp
Lines changed: 0 additions & 20 deletions
diff --git a/sycl/test-e2e/Matrix/XMX8/joint_matrix_bf16_fill_k_cache_init.cpp b/sycl/test-e2e/Matrix/XMX8/joint_matrix_bf16_fill_k_cache_init.cpp
Lines changed: 0 additions & 20 deletions
diff --git a/sycl/test-e2e/Matrix/XMX8/joint_matrix_bf16_fill_k_cache_unroll.cpp b/sycl/test-e2e/Matrix/XMX8/joint_matrix_bf16_fill_k_cache_unroll.cpp
Lines changed: 0 additions & 22 deletions
diff --git a/sycl/test-e2e/Matrix/XMX8/joint_matrix_bf16_fill_k_cache_unroll_init.cpp b/sycl/test-e2e/Matrix/XMX8/joint_matrix_bf16_fill_k_cache_unroll_init.cpp
Lines changed: 0 additions & 22 deletions
diff --git a/sycl/test-e2e/Matrix/XMX8/joint_matrix_colA_rowB_colC.cpp b/sycl/test-e2e/Matrix/XMX8/joint_matrix_colA_rowB_colC.cpp
Lines changed: 0 additions & 19 deletions
diff --git a/sycl/test-e2e/Matrix/XMX8/joint_matrix_out_bounds.cpp b/sycl/test-e2e/Matrix/XMX8/joint_matrix_out_bounds.cpp
Lines changed: 0 additions & 20 deletions
diff --git a/sycl/test-e2e/Matrix/XMX8/joint_matrix_unaligned_k.cpp b/sycl/test-e2e/Matrix/XMX8/joint_matrix_unaligned_k.cpp
Lines changed: 0 additions & 20 deletions
diff --git a/sycl/test-e2e/Matrix/joint_matrix_bf16_fill_k_cache.cpp b/sycl/test-e2e/Matrix/joint_matrix_bf16_fill_k_cache.cpp
Lines changed: 3 additions & 10 deletions
diff --git a/sycl/test-e2e/Matrix/joint_matrix_bf16_fill_k_cache_OOB.cpp b/sycl/test-e2e/Matrix/joint_matrix_bf16_fill_k_cache_OOB.cpp
Lines changed: 0 additions & 5 deletions
@@ -5,21 +5,18 @@
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//
-// REQUIRES: matrix
+// SG size = 32 is not currently supported for SYCL Joint Matrix by IGC on DG2
+// UNSUPPORTED: gpu-intel-dg2
+// REQUIRES: aspect-ext_intel_matrix
 // REQUIRES-INTEL-DRIVER: lin: 27501, win: 101.4943
 
-// RUN: %{build} -o %t_gpu.out -ffp-model=precise
-// RUN: %if gpu %{ %{run} %t_gpu.out %}
-
-// RUN: %{build}  -ffp-model=precise -o %t_cpu.out -DtM=16 -DtK=32 -DNCACHE1=32 -DKCACHE1=32
-// RUN: %if cpu %{ %{run} %t_cpu.out %}
+// RUN: %{build} -o %t.out -ffp-model=precise
+// RUN: %{run} %t.out
 
 // -ffp-model=precise is added to not depend on compiler defaults.
 
 #include "../common.hpp"
-#include <cstddef>
 
 #define SG_SZ 32
-constexpr size_t TN = 16;
 
 #include "../joint_matrix_bf16_fill_k_cache_impl.hpp"
@@ -5,7 +5,9 @@
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//
-// REQUIRES: matrix, gpu
+// SG size = 32 is not currently supported for SYCL Joint Matrix by IGC on DG2
+// UNSUPPORTED: gpu-intel-dg2
+// REQUIRES: aspect-ext_intel_matrix, gpu
 // REQUIRES-INTEL-DRIVER: lin: 27501, win: 101.4943
 
 // RUN: %{build} -o %t.out -DINIT_LIST -ffp-model=precise
@@ -14,9 +16,7 @@
 // -ffp-model=precise is added to not depend on compiler defaults.
 
 #include "../common.hpp"
-#include <cstddef>
 
 #define SG_SZ 32
-constexpr size_t TN = 16;
 
 #include "../joint_matrix_bf16_fill_k_cache_impl.hpp"
@@ -5,23 +5,20 @@
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//
-// REQUIRES: matrix
+// SG size = 32 is not currently supported for SYCL Joint Matrix by IGC on DG2
+// UNSUPPORTED: gpu-intel-dg2
+// REQUIRES: aspect-ext_intel_matrix
 // REQUIRES-INTEL-DRIVER: lin: 27501, win: 101.4943
 
-// RUN: %{build} -mllvm -inline-threshold=5000 -ffp-model=precise -o %t_gpu.out -DMANUAL_UNROLL
-// RUN: %if gpu %{ %{run} %t_gpu.out %}
-
-// RUN: %{build} -mllvm -inline-threshold=5000 -ffp-model=precise -o %t_cpu.out -DMANUAL_UNROLL -DtM=16 -DtK=32 -DNCACHE1=32 -DKCACHE1=32
-// RUN: %if cpu %{ %{run} %t_cpu.out %}
+// RUN: %{build} -mllvm -inline-threshold=5000 -ffp-model=precise -o %t.out -DMANUAL_UNROLL
+// RUN: %{run} %t.out
 
 // -mllvm -inline-threshold added as a workaround,
 // since IGC doesn't support some variants of IR for Joint Matrix currently
 // -ffp-model=precise is added to not depend on compiler defaults.
 
 #include "../common.hpp"
-#include <cstddef>
 
 #define SG_SZ 32
-constexpr size_t TN = 16;
 
 #include "../joint_matrix_bf16_fill_k_cache_impl.hpp"
@@ -5,7 +5,9 @@
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//
-// REQUIRES: matrix, gpu
+// SG size = 32 is not currently supported for SYCL Joint Matrix by IGC on DG2
+// UNSUPPORTED: gpu-intel-dg2
+// REQUIRES: aspect-ext_intel_matrix, gpu
 // REQUIRES-INTEL-DRIVER: lin: 27501, win: 101.4943
 
 // RUN: %{build} -mllvm -inline-threshold=5000 -ffp-model=precise -o %t_gpu.out -DINIT_LIST -DMANUAL_UNROLL
@@ -16,9 +18,7 @@
 // -ffp-model=precise is added to not depend on compiler defaults.
 
 #include "../common.hpp"
-#include <cstddef>
 
 #define SG_SZ 32
-constexpr size_t TN = 16;
 
 #include "../joint_matrix_bf16_fill_k_cache_impl.hpp"
@@ -5,19 +5,12 @@
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//
-// REQUIRES: matrix
+// REQUIRES: aspect-ext_intel_matrix
 
-// RUN: %{build} -o %t_gpu.out -ffp-model=precise
-// RUN: %if gpu %{ %{run} %t_gpu.out %}
-
-// RUN: %{build}  -ffp-model=precise -o %t_cpu.out -DtM=16 -DtK=32 -DNCACHE1=32 -DKCACHE1=32
-// RUN: %if cpu %{ %{run} %t_cpu.out %}
+// RUN: %{build} -o %t.out -ffp-model=precise
+// RUN: %{run} %t.out
 
 // -ffp-model=precise is added to not depend on compiler defaults.
 
 #include "common.hpp"
-#include <cstddef>
-
-constexpr size_t TN = 16;
-
 #include "joint_matrix_bf16_fill_k_cache_impl.hpp"
@@ -16,9 +16,4 @@
 // -ffp-model=precise is added to not depend on compiler defaults.
 
 #include "common.hpp"
-#include <cstddef>
-
-#define SG_SZ 16
-constexpr size_t TN = 16;
-
 #include "joint_matrix_bf16_fill_k_cache_impl.hpp"