|
1 | 1 | ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 |
2 | | -; ## Some FP16 support but not for abs |
3 | | -; RUN: llc < %s -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 \ |
4 | | -; RUN: -O0 -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
5 | | -; RUN: | FileCheck -allow-deprecated-dag-overlap -check-prefixes CHECK-NOF16 %s |
6 | | -; RUN: %if ptxas %{ \ |
7 | | -; RUN: llc < %s -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 \ |
8 | | -; RUN: -O0 -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
9 | | -; RUN: | %ptxas-verify -arch=sm_53 \ |
| 2 | + |
| 3 | +; ## FP16 abs is not supported by the targeted PTX version (PTX < 65). |
| 4 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx60 \ |
| 5 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 6 | +; RUN: | FileCheck -check-prefix CHECK-NOF16 %s |
| 7 | +; RUN: %if ptxas %{ \ |
| 8 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx60 \ |
| 9 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 10 | +; RUN: | %ptxas-verify -arch=sm_53 \ |
10 | 11 | ; RUN: %} |
11 | 12 |
|
12 | | -; ## FP16 support explicitly disabled. |
13 | | -; RUN: llc < %s -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 \ |
14 | | -; RUN: -O0 -disable-post-ra -frame-pointer=all --nvptx-no-f16-math \ |
15 | | -; RUN: -verify-machineinstrs \ |
16 | | -; RUN: | FileCheck -allow-deprecated-dag-overlap -check-prefixes CHECK-NOF16 %s |
17 | | -; RUN: %if ptxas %{ \ |
18 | | -; RUN: llc < %s -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 \ |
19 | | -; RUN: -O0 -disable-post-ra -frame-pointer=all --nvptx-no-f16-math \ |
20 | | -; RUN: -verify-machineinstrs \ |
21 | | -; RUN: | %ptxas-verify -arch=sm_53 \ |
| 13 | +; ## FP16 support explicitly disabled (--nvptx-no-f16-math). |
| 14 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx65 --nvptx-no-f16-math \ |
| 15 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 16 | +; RUN: | FileCheck -check-prefix CHECK-NOF16 %s |
| 17 | +; RUN: %if ptxas %{ \ |
| 18 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx65 --nvptx-no-f16-math \ |
| 19 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 20 | +; RUN: | %ptxas-verify -arch=sm_53 \ |
22 | 21 | ; RUN: %} |
23 | 22 |
|
24 | | -; ## FP16 is not supported by hardware. |
25 | | -; RUN: llc < %s -O0 -mtriple=nvptx64-nvidia-cuda -mcpu=sm_52 \ |
26 | | -; RUN: -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
27 | | -; RUN: | FileCheck -allow-deprecated-dag-overlap -check-prefixes CHECK-NOF16 %s |
28 | | -; RUN: %if ptxas %{ \ |
29 | | -; RUN: llc < %s -O0 -mtriple=nvptx64-nvidia-cuda -mcpu=sm_52 \ |
30 | | -; RUN: -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
31 | | -; RUN: | %ptxas-verify -arch=sm_52 \ |
| 23 | +; ## FP16 is not supported by hardware (SM < 53). |
| 24 | +; RUN: llc < %s -mcpu=sm_52 -mattr=+ptx65 \ |
| 25 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 26 | +; RUN: | FileCheck -check-prefix CHECK-NOF16 %s |
| 27 | +; RUN: %if ptxas %{ \ |
| 28 | +; RUN: llc < %s -mcpu=sm_52 -mattr=+ptx65 \ |
| 29 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 30 | +; RUN: | %ptxas-verify -arch=sm_52 \ |
32 | 31 | ; RUN: %} |
33 | 32 |
|
34 | | -; ## Full FP16 support. |
35 | | -; RUN: llc < %s -O0 -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 -mattr=+ptx70 \ |
36 | | -; RUN: -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
37 | | -; RUN: | FileCheck -allow-deprecated-dag-overlap -check-prefixes CHECK-F16-ABS %s |
38 | | -; RUN: %if ptxas %{ \ |
39 | | -; RUN: llc < %s -O0 -mtriple=nvptx64-nvidia-cuda -mcpu=sm_53 -mattr=+ptx70 \ |
40 | | -; RUN: -disable-post-ra -frame-pointer=all -verify-machineinstrs \ |
41 | | -; RUN: | %ptxas-verify -arch=sm_53 \ |
| 33 | +; ## Full FP16 abs support. |
| 34 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx65 \ |
| 35 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 36 | +; RUN: | FileCheck -check-prefix CHECK-F16-ABS %s |
| 37 | +; RUN: %if ptxas %{ \ |
| 38 | +; RUN: llc < %s -mcpu=sm_53 -mattr=+ptx65 \ |
| 39 | +; RUN: -O0 -disable-post-ra -verify-machineinstrs \ |
| 40 | +; RUN: | %ptxas-verify -arch=sm_53 \ |
42 | 41 | ; RUN: %} |
43 | 42 |
|
44 | 43 | target triple = "nvptx64-nvidia-cuda" |
|
0 commit comments