@@ -1244,45 +1244,45 @@ __device__ void nvvm_cvt_sm100a_sm103a() {
12441244// CHECK_PTX87_SM103a: call <2 x bfloat> @llvm.nvvm.ff2bf16x2.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, i32 0)
12451245 __nvvm_ff2bf16x2_rs_relu_satfinite (1.0f , 1.0f , 0 );
12461246
1247- // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.ff .to.e4m3x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1248- // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.ff .to.e4m3x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1249- __nvvm_ff_to_e4m3x4_rs_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1247+ // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.f32x4 .to.e4m3x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1248+ // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.f32x4 .to.e4m3x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1249+ __nvvm_f32x4_to_e4m3x4_rs_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12501250
1251- // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.ff .to.e4m3x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1252- // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.ff .to.e4m3x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1253- __nvvm_ff_to_e4m3x4_rs_relu_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1251+ // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.f32x4 .to.e4m3x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1252+ // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.f32x4 .to.e4m3x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1253+ __nvvm_f32x4_to_e4m3x4_rs_relu_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12541254
1255- // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.ff .to.e5m2x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1256- // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.ff .to.e5m2x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1257- __nvvm_ff_to_e5m2x4_rs_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1255+ // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.f32x4 .to.e5m2x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1256+ // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.f32x4 .to.e5m2x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1257+ __nvvm_f32x4_to_e5m2x4_rs_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12581258
1259- // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.ff .to.e5m2x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1260- // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.ff .to.e5m2x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1261- __nvvm_ff_to_e5m2x4_rs_relu_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1259+ // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.f32x4 .to.e5m2x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1260+ // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.f32x4 .to.e5m2x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1261+ __nvvm_f32x4_to_e5m2x4_rs_relu_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12621262
1263- // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.ff .to.e2m3x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1264- // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.ff .to.e2m3x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1265- __nvvm_ff_to_e2m3x4_rs_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1263+ // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.f32x4 .to.e2m3x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1264+ // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.f32x4 .to.e2m3x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1265+ __nvvm_f32x4_to_e2m3x4_rs_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12661266
1267- // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.ff .to.e2m3x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1268- // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.ff .to.e2m3x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1269- __nvvm_ff_to_e2m3x4_rs_relu_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1267+ // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.f32x4 .to.e2m3x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1268+ // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.f32x4 .to.e2m3x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1269+ __nvvm_f32x4_to_e2m3x4_rs_relu_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12701270
1271- // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.ff .to.e3m2x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1272- // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.ff .to.e3m2x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1273- __nvvm_ff_to_e3m2x4_rs_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1271+ // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.f32x4 .to.e3m2x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1272+ // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.f32x4 .to.e3m2x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1273+ __nvvm_f32x4_to_e3m2x4_rs_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12741274
1275- // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.ff .to.e3m2x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1276- // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.ff .to.e3m2x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1277- __nvvm_ff_to_e3m2x4_rs_relu_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1275+ // CHECK_PTX87_SM100a: call <4 x i8> @llvm.nvvm.f32x4 .to.e3m2x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1276+ // CHECK_PTX87_SM103a: call <4 x i8> @llvm.nvvm.f32x4 .to.e3m2x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1277+ __nvvm_f32x4_to_e3m2x4_rs_relu_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12781278
1279- // CHECK_PTX87_SM100a: call i16 @llvm.nvvm.ff .to.e2m1x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1280- // CHECK_PTX87_SM103a: call i16 @llvm.nvvm.ff .to.e2m1x4.rs.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1281- __nvvm_ff_to_e2m1x4_rs_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1279+ // CHECK_PTX87_SM100a: call i16 @llvm.nvvm.f32x4 .to.e2m1x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1280+ // CHECK_PTX87_SM103a: call i16 @llvm.nvvm.f32x4 .to.e2m1x4.rs.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1281+ __nvvm_f32x4_to_e2m1x4_rs_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12821282
1283- // CHECK_PTX87_SM100a: call i16 @llvm.nvvm.ff .to.e2m1x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1284- // CHECK_PTX87_SM103a: call i16 @llvm.nvvm.ff .to.e2m1x4.rs.relu.satfinite(float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00 , i32 0)
1285- __nvvm_ff_to_e2m1x4_rs_relu_satfinite ( 1.0f , 1.0f , 1.0f , 1.0f , 0 );
1283+ // CHECK_PTX87_SM100a: call i16 @llvm.nvvm.f32x4 .to.e2m1x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1284+ // CHECK_PTX87_SM103a: call i16 @llvm.nvvm.f32x4 .to.e2m1x4.rs.relu.satfinite(<4 x float> splat ( float 1.000000e+00) , i32 0)
1285+ __nvvm_f32x4_to_e2m1x4_rs_relu_satfinite ({ 1.0f , 1.0f , 1.0f , 1.0f } , 0 );
12861286#endif
12871287}
12881288
0 commit comments