File tree 4 files changed +22
-4
lines changed
test/tools/sycl-post-link/device-code-split
sycl/test-e2e/KernelAndProgram
4 files changed +22
-4
lines changed Original file line number Diff line number Diff line change @@ -113,7 +113,8 @@ bool isGenericBuiltin(StringRef FName) {
113
113
}
114
114
115
115
bool isKernel (const Function &F) {
116
- return F.getCallingConv () == CallingConv::SPIR_KERNEL;
116
+ return F.getCallingConv () == CallingConv::SPIR_KERNEL ||
117
+ F.getCallingConv () == CallingConv::AMDGPU_KERNEL;
117
118
}
118
119
119
120
bool isEntryPoint (const Function &F, bool EmitOnlyKernelsAsEntryPoints) {
Original file line number Diff line number Diff line change
1
+ ; -- Per-kernel split
2
+ ; RUN: sycl-post-link -split=kernel -emit-only-kernels-as-entry-points -S < %s -o %tC.table
3
+ ; RUN: FileCheck %s -input-file=%tC_0.ll --check-prefixes CHECK-A0
4
+ ; RUN: FileCheck %s -input-file=%tC_1.ll --check-prefixes CHECK-A1
5
+
6
+ define dso_local amdgpu_kernel void @Kernel1 () {
7
+ ret void
8
+ }
9
+
10
+ define dso_local amdgpu_kernel void @Kernel2 () {
11
+ ret void
12
+ }
13
+
14
+ ; CHECK-A0: define dso_local amdgpu_kernel void @Kernel2()
15
+ ; CHECK-A0-NOT: define dso_local amdgpu_kernel void @Kernel1()
16
+ ; CHECK-A1-NOT: define dso_local amdgpu_kernel void @Kernel2()
17
+ ; CHECK-A1: define dso_local amdgpu_kernel void @Kernel1()
Original file line number Diff line number Diff line change 3
3
// RUN: %{run} %t.out
4
4
5
5
// The name mangling for free function kernels currently does not work with PTX.
6
- // UNSUPPORTED: cuda, hip
6
+ // UNSUPPORTED: cuda
7
7
8
8
#include <iostream>
9
9
#include <sycl/detail/core.hpp>
Original file line number Diff line number Diff line change 3
3
// RUN: %{run} %t.out
4
4
5
5
// The name mangling for free function kernels currently does not work with PTX.
6
- // UNSUPPORTED: cuda, hip
6
+ // UNSUPPORTED: cuda
7
7
8
8
// This test tests free function kernel code generation and execution.
9
9
@@ -212,7 +212,7 @@ SYCL_EXTERNAL SYCL_EXT_ONEAPI_FUNCTION_PROPERTY((
212
212
ptr2D[GId.get (0 )][GId.get (1 )] = LId.get (0 ) + LId.get (1 ) + start;
213
213
}
214
214
215
- // Explicit instantiation with “int*”.
215
+ // Explicit instantiation with “int*”.
216
216
template void ff_3 (int *ptr, int start);
217
217
218
218
bool test_3 (queue Queue) {
You can’t perform that action at this time.
0 commit comments