| 
 | 1 | +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5  | 
 | 2 | +; RUN: llc < %s -mtriple=nvptx64 -mcpu=sm_90 -mattr=+ptx78| FileCheck --check-prefixes=CHECK %s  | 
 | 3 | +; RUN: %if ptxas-12.0 %{ llc < %s -mtriple=nvptx64 -mcpu=sm_90 -mattr=+ptx78| %ptxas-verify -arch=sm_90 %}  | 
 | 4 | + | 
 | 5 | +declare i32 @llvm.nvvm.f2tf32.rn(float %f1)  | 
 | 6 | +declare i32 @llvm.nvvm.f2tf32.rn.relu(float %f1)  | 
 | 7 | +declare i32 @llvm.nvvm.f2tf32.rz(float %f1)  | 
 | 8 | +declare i32 @llvm.nvvm.f2tf32.rz.relu(float %f1)  | 
 | 9 | + | 
 | 10 | +define i32 @cvt_rn_tf32_f32(float %f1) {  | 
 | 11 | +; CHECK-LABEL: cvt_rn_tf32_f32(  | 
 | 12 | +; CHECK:       {  | 
 | 13 | +; CHECK-NEXT:    .reg .b32 %r<2>;  | 
 | 14 | +; CHECK-NEXT:    .reg .f32 %f<2>;  | 
 | 15 | +; CHECK-EMPTY:  | 
 | 16 | +; CHECK-NEXT:  // %bb.0:  | 
 | 17 | +; CHECK-NEXT:    ld.param.f32 %f1, [cvt_rn_tf32_f32_param_0];  | 
 | 18 | +; CHECK-NEXT:    cvt.rn.tf32.f32 %r1, %f1;  | 
 | 19 | +; CHECK-NEXT:    st.param.b32 [func_retval0], %r1;  | 
 | 20 | +; CHECK-NEXT:    ret;  | 
 | 21 | +  %val = call i32 @llvm.nvvm.f2tf32.rn(float %f1)  | 
 | 22 | +  ret i32 %val  | 
 | 23 | +}  | 
 | 24 | + | 
 | 25 | +define i32 @cvt_rn_relu_tf32_f32(float %f1) {  | 
 | 26 | +; CHECK-LABEL: cvt_rn_relu_tf32_f32(  | 
 | 27 | +; CHECK:       {  | 
 | 28 | +; CHECK-NEXT:    .reg .b32 %r<2>;  | 
 | 29 | +; CHECK-NEXT:    .reg .f32 %f<2>;  | 
 | 30 | +; CHECK-EMPTY:  | 
 | 31 | +; CHECK-NEXT:  // %bb.0:  | 
 | 32 | +; CHECK-NEXT:    ld.param.f32 %f1, [cvt_rn_relu_tf32_f32_param_0];  | 
 | 33 | +; CHECK-NEXT:    cvt.rn.relu.tf32.f32 %r1, %f1;  | 
 | 34 | +; CHECK-NEXT:    st.param.b32 [func_retval0], %r1;  | 
 | 35 | +; CHECK-NEXT:    ret;  | 
 | 36 | +  %val = call i32 @llvm.nvvm.f2tf32.rn.relu(float %f1)  | 
 | 37 | +  ret i32 %val  | 
 | 38 | +}  | 
 | 39 | + | 
 | 40 | +define i32 @cvt_rz_tf32_f32(float %f1) {  | 
 | 41 | +; CHECK-LABEL: cvt_rz_tf32_f32(  | 
 | 42 | +; CHECK:       {  | 
 | 43 | +; CHECK-NEXT:    .reg .b32 %r<2>;  | 
 | 44 | +; CHECK-NEXT:    .reg .f32 %f<2>;  | 
 | 45 | +; CHECK-EMPTY:  | 
 | 46 | +; CHECK-NEXT:  // %bb.0:  | 
 | 47 | +; CHECK-NEXT:    ld.param.f32 %f1, [cvt_rz_tf32_f32_param_0];  | 
 | 48 | +; CHECK-NEXT:    cvt.rz.tf32.f32 %r1, %f1;  | 
 | 49 | +; CHECK-NEXT:    st.param.b32 [func_retval0], %r1;  | 
 | 50 | +; CHECK-NEXT:    ret;  | 
 | 51 | +  %val = call i32 @llvm.nvvm.f2tf32.rz(float %f1)  | 
 | 52 | +  ret i32 %val  | 
 | 53 | +}  | 
 | 54 | + | 
 | 55 | +define i32 @cvt_rz_relu_tf32_f32(float %f1) {  | 
 | 56 | +; CHECK-LABEL: cvt_rz_relu_tf32_f32(  | 
 | 57 | +; CHECK:       {  | 
 | 58 | +; CHECK-NEXT:    .reg .b32 %r<2>;  | 
 | 59 | +; CHECK-NEXT:    .reg .f32 %f<2>;  | 
 | 60 | +; CHECK-EMPTY:  | 
 | 61 | +; CHECK-NEXT:  // %bb.0:  | 
 | 62 | +; CHECK-NEXT:    ld.param.f32 %f1, [cvt_rz_relu_tf32_f32_param_0];  | 
 | 63 | +; CHECK-NEXT:    cvt.rz.relu.tf32.f32 %r1, %f1;  | 
 | 64 | +; CHECK-NEXT:    st.param.b32 [func_retval0], %r1;  | 
 | 65 | +; CHECK-NEXT:    ret;  | 
 | 66 | +  %val = call i32 @llvm.nvvm.f2tf32.rz.relu(float %f1)  | 
 | 67 | +  ret i32 %val  | 
 | 68 | +}  | 
0 commit comments