File tree 4 files changed +3
-17
lines changed
4 files changed +3
-17
lines changed Original file line number Diff line number Diff line change 4
4
// + sm_80 and above uses some native bfloat16 math instructions
5
5
// + below sm_80 always uses generic impls
6
6
7
- // DEFINE: %{mathflags} = %if cl_options %{/clang:-fno-fast-math%} %else %{-fno-fast-math%}
8
- // REQUIRES: aspect-ext_oneapi_bfloat16_math_functions
9
- // RUN: %clangxx -fsycl -fsycl-targets=%{sycl_triple} %if any-device-is-cuda %{ -Xsycl-target-backend --cuda-gpu-arch=sm_80 %} %s -o %t.out %{mathflags}
10
- // RUN: %{run} %t.out
11
-
12
- // Test "new" (ABI breaking) for all platforms ( sm_80/native if CUDA )
13
- // RUN: %if preview-breaking-changes-supported %{ %clangxx -fsycl -fpreview-breaking-changes -fsycl-targets=%{sycl_triple} %if any-device-is-cuda %{ -Xsycl-target-backend --cuda-gpu-arch=sm_80 %} %s -o %t2.out %{mathflags} %}
14
- // RUN: %if preview-breaking-changes-supported %{ %{run} %t2.out %}
15
-
16
- // If CUDA, test "new" again for sm_75/generic
17
- // RUN: %if any-device-is-cuda %{ %if preview-breaking-changes-supported %{ %clangxx -fsycl -fpreview-breaking-changes -fsycl-targets=%{sycl_triple} -Xsycl-target-backend --cuda-gpu-arch=sm_75 %s -o %t3.out %{mathflags} %} %}
18
- // RUN: %if any-device-is-cuda %{ %if preview-breaking-changes-supported %{ %{run} %t3.out %} %}
19
-
20
- // Currently the feature isn't supported on FPGA.
21
- // UNSUPPORTED: accelerator
22
7
#include <sycl/sycl.hpp>
23
8
24
9
#include <cmath>
Original file line number Diff line number Diff line change 5
5
// + below sm_80 always uses generic impls
6
6
7
7
// DEFINE: %{mathflags} = %if cl_options %{/clang:-fno-fast-math%} %else %{-fno-fast-math%}
8
+ // REQUIRES: aspect-ext_oneapi_bfloat16_math_functions
8
9
9
10
// If CUDA, test "new" again for sm_75/generic
10
11
// RUN: %if any-device-is-cuda %{ %if preview-breaking-changes-supported %{ %clangxx -fsycl -fpreview-breaking-changes -fsycl-targets=%{sycl_triple} -Xsycl-target-backend --cuda-gpu-arch=sm_75 %s -o %t3.out %{mathflags} %} %}
Original file line number Diff line number Diff line change 32
32
33
33
// UNSUPPORTED: hip || (windows && level_zero)
34
34
35
- // RUN: %clangxx -std=c++20 -fsycl -fsycl-targets=%{sycl_triple} %if any-device-is-cuda %{ -Xsycl-target-backend --cuda-gpu-arch=sm_70 %} %s -o %t.out
35
+ // RUN: %clangxx -std=c++20 -fsycl -fsycl-targets=%{sycl_triple} %if any-device-is-cuda %{ -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 %} %s -o %t.out
36
36
// RUN: %{run} %t.out
37
37
38
38
#include <sycl/sycl.hpp>
Original file line number Diff line number Diff line change 32
32
33
33
// UNSUPPORTED: hip
34
34
35
- // RUN: %clangxx -fsycl -fsycl-targets=%{sycl_triple} %if any-device-is-cuda %{ -Xsycl-target-backend --cuda-gpu-arch=sm_70 %} %s -o %t.out
35
+ // RUN: %clangxx -fsycl -fsycl-targets=%{sycl_triple} %if any-device-is-cuda %{ -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 %} %s -o %t.out
36
36
// RUN: %{run} %t.out
37
37
38
38
#include <iostream>
You can’t perform that action at this time.
0 commit comments