|
1 | 1 | ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
|
2 |
| -; ## Some FP16 support but not for abs |
3 |
| -; RUN: llc < %s -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 \ |
4 |
| -; RUN: -O0 -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
5 |
| -; RUN: | FileCheck -allow-deprecated-dag-overlap -check-prefixes CHECK-NOF16 %s |
6 |
| -; RUN: %if ptxas %{ \ |
7 |
| -; RUN: llc < %s -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 \ |
8 |
| -; RUN: -O0 -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
9 |
| -; RUN: | %ptxas-verify -arch=sm_53 \ |
| 2 | + |
| 3 | +; ## FP16 abs is not supported by PTX version (PTX < 65). |
| 4 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx60 \ |
| 5 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 6 | +; RUN: | FileCheck -check-prefix CHECK-NOF16 %s |
| 7 | +; RUN: %if ptxas %{ \ |
| 8 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx60 \ |
| 9 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 10 | +; RUN: | %ptxas-verify -arch=sm_53 \ |
10 | 11 | ; RUN: %}
|
11 | 12 |
|
12 |
| -; ## FP16 support explicitly disabled. |
13 |
| -; RUN: llc < %s -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 \ |
14 |
| -; RUN: -O0 -disable-post-ra -frame-pointer=all --nvptx-no-f16-math \ |
15 |
| -; RUN: -verify-machineinstrs \ |
16 |
| -; RUN: | FileCheck -allow-deprecated-dag-overlap -check-prefixes CHECK-NOF16 %s |
17 |
| -; RUN: %if ptxas %{ \ |
18 |
| -; RUN: llc < %s -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 \ |
19 |
| -; RUN: -O0 -disable-post-ra -frame-pointer=all --nvptx-no-f16-math \ |
20 |
| -; RUN: -verify-machineinstrs \ |
21 |
| -; RUN: | %ptxas-verify -arch=sm_53 \ |
| 13 | +; ## FP16 support explicitly disabled (--nvptx-no-f16-math). |
| 14 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx65 --nvptx-no-f16-math \ |
| 15 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 16 | +; RUN: | FileCheck -check-prefix CHECK-NOF16 %s |
| 17 | +; RUN: %if ptxas %{ \ |
| 18 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx65 --nvptx-no-f16-math \ |
| 19 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 20 | +; RUN: | %ptxas-verify -arch=sm_53 \ |
22 | 21 | ; RUN: %}
|
23 | 22 |
|
24 |
| -; ## FP16 is not supported by hardware. |
25 |
| -; RUN: llc < %s -O0 -mtriple=nvptx64-nvidia-cuda -mcpu=sm_52 \ |
26 |
| -; RUN: -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
27 |
| -; RUN: | FileCheck -allow-deprecated-dag-overlap -check-prefixes CHECK-NOF16 %s |
28 |
| -; RUN: %if ptxas %{ \ |
29 |
| -; RUN: llc < %s -O0 -mtriple=nvptx64-nvidia-cuda -mcpu=sm_52 \ |
30 |
| -; RUN: -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
31 |
| -; RUN: | %ptxas-verify -arch=sm_52 \ |
| 23 | +; ## FP16 is not supported by hardware (SM < 53). |
| 24 | +; RUN: llc < %s -mcpu=sm_52 -mattr=+ptx65 \ |
| 25 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 26 | +; RUN: | FileCheck -check-prefix CHECK-NOF16 %s |
| 27 | +; RUN: %if ptxas %{ \ |
| 28 | +; RUN: llc < %s -mcpu=sm_52 -mattr=+ptx65 \ |
| 29 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 30 | +; RUN: | %ptxas-verify -arch=sm_52 \ |
32 | 31 | ; RUN: %}
|
33 | 32 |
|
34 |
| -; ## Full FP16 support. |
35 |
| -; RUN: llc < %s -O0 -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 -mattr=+ptx70 \ |
36 |
| -; RUN: -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
37 |
| -; RUN: | FileCheck -allow-deprecated-dag-overlap -check-prefixes CHECK-F16-ABS %s |
38 |
| -; RUN: %if ptxas %{ \ |
39 |
| -; RUN: llc < %s -O0 -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 -mattr=+ptx70 \ |
40 |
| -; RUN: -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
41 |
| -; RUN: | %ptxas-verify -arch=sm_53 \ |
| 33 | +; ## Full FP16 abs support. |
| 34 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx65 \ |
| 35 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 36 | +; RUN: | FileCheck -check-prefix CHECK-F16-ABS %s |
| 37 | +; RUN: %if ptxas %{ \ |
| 38 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx65 \ |
| 39 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 40 | +; RUN: | %ptxas-verify -arch=sm_53 \ |
42 | 41 | ; RUN: %}
|
43 | 42 |
|
44 | 43 | target triple = "nvptx64-nvidia-cuda"
|
|
0 commit comments