@@ -579,19 +579,35 @@ def __nvvm_ff2bf16x2_rn : NVPTXBuiltinSMAndPTX<"_Vector<2, __bf16>(float, float)
579579def __nvvm_ff2bf16x2_rn_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float)" , SM_80, PTX70>;
580580def __nvvm_ff2bf16x2_rz : NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float)" , SM_80, PTX70>;
581581def __nvvm_ff2bf16x2_rz_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float)" , SM_80, PTX70>;
582- def __nvvm_ff2bf16x2_rs : NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
583- def __nvvm_ff2bf16x2_rs_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
584- def __nvvm_ff2bf16x2_rs_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
585- def __nvvm_ff2bf16x2_rs_relu_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
582+ def __nvvm_ff2bf16x2_rs :
583+ NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float, uint32_t)" ,
584+ SM<" 100a" , [SM_103a]>, PTX87>;
585+ def __nvvm_ff2bf16x2_rs_relu :
586+ NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float, uint32_t)" ,
587+ SM<" 100a" , [SM_103a]>, PTX87>;
588+ def __nvvm_ff2bf16x2_rs_satfinite :
589+ NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float, uint32_t)" ,
590+ SM<" 100a" , [SM_103a]>, PTX87>;
591+ def __nvvm_ff2bf16x2_rs_relu_satfinite :
592+ NVPTXBuiltinSMAndPTX<" _Vector<2, __bf16>(float, float, uint32_t)" ,
593+ SM<" 100a" , [SM_103a]>, PTX87>;
586594
587595def __nvvm_ff2f16x2_rn : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float)" , SM_80, PTX70>;
588596def __nvvm_ff2f16x2_rn_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float)" , SM_80, PTX70>;
589597def __nvvm_ff2f16x2_rz : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float)" , SM_80, PTX70>;
590598def __nvvm_ff2f16x2_rz_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float)" , SM_80, PTX70>;
591- def __nvvm_ff2f16x2_rs : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
592- def __nvvm_ff2f16x2_rs_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
593- def __nvvm_ff2f16x2_rs_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
594- def __nvvm_ff2f16x2_rs_relu_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
599+ def __nvvm_ff2f16x2_rs :
600+ NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float, uint32_t)" ,
601+ SM<" 100a" , [SM_103a]>, PTX87>;
602+ def __nvvm_ff2f16x2_rs_relu :
603+ NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float, uint32_t)" ,
604+ SM<" 100a" , [SM_103a]>, PTX87>;
605+ def __nvvm_ff2f16x2_rs_satfinite :
606+ NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float, uint32_t)" ,
607+ SM<" 100a" , [SM_103a]>, PTX87>;
608+ def __nvvm_ff2f16x2_rs_relu_satfinite :
609+ NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(float, float, uint32_t)" ,
610+ SM<" 100a" , [SM_103a]>, PTX87>;
595611
596612def __nvvm_f2bf16_rn : NVPTXBuiltinSMAndPTX<" __bf16(float)" , SM_80, PTX70>;
597613def __nvvm_f2bf16_rn_relu : NVPTXBuiltinSMAndPTX<" __bf16(float)" , SM_80, PTX70>;
@@ -624,10 +640,18 @@ def __nvvm_e4m3x2_to_f16x2_rn_relu : NVPTXBuiltinSMAndPTX<"_Vector<2, __fp16>(sh
624640def __nvvm_e5m2x2_to_f16x2_rn : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(short)" , SM_89, PTX81>;
625641def __nvvm_e5m2x2_to_f16x2_rn_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(short)" , SM_89, PTX81>;
626642
627- def __nvvm_f32x4_to_e4m3x4_rs_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
628- def __nvvm_f32x4_to_e4m3x4_rs_relu_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
629- def __nvvm_f32x4_to_e5m2x4_rs_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
630- def __nvvm_f32x4_to_e5m2x4_rs_relu_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
643+ def __nvvm_f32x4_to_e4m3x4_rs_satfinite :
644+ NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" ,
645+ SM<" 100a" , [SM_103a]>, PTX87>;
646+ def __nvvm_f32x4_to_e4m3x4_rs_relu_satfinite :
647+ NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" ,
648+ SM<" 100a" , [SM_103a]>, PTX87>;
649+ def __nvvm_f32x4_to_e5m2x4_rs_satfinite :
650+ NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" ,
651+ SM<" 100a" , [SM_103a]>, PTX87>;
652+ def __nvvm_f32x4_to_e5m2x4_rs_relu_satfinite :
653+ NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" ,
654+ SM<" 100a" , [SM_103a]>, PTX87>;
631655
632656def __nvvm_ff_to_e2m3x2_rn_satfinite : NVPTXBuiltinSMAndPTX<" short(float, float)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
633657def __nvvm_ff_to_e2m3x2_rn_relu_satfinite : NVPTXBuiltinSMAndPTX<" short(float, float)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
@@ -639,19 +663,31 @@ def __nvvm_e2m3x2_to_f16x2_rn_relu : NVPTXBuiltinSMAndPTX<"_Vector<2, __fp16>(sh
639663def __nvvm_e3m2x2_to_f16x2_rn : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(short)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
640664def __nvvm_e3m2x2_to_f16x2_rn_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(short)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
641665
642- def __nvvm_f32x4_to_e2m3x4_rs_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
643- def __nvvm_f32x4_to_e2m3x4_rs_relu_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
644- def __nvvm_f32x4_to_e3m2x4_rs_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
645- def __nvvm_f32x4_to_e3m2x4_rs_relu_satfinite : NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
666+ def __nvvm_f32x4_to_e2m3x4_rs_satfinite :
667+ NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" ,
668+ SM<" 100a" , [SM_103a]>, PTX87>;
669+ def __nvvm_f32x4_to_e2m3x4_rs_relu_satfinite :
670+ NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" ,
671+ SM<" 100a" , [SM_103a]>, PTX87>;
672+ def __nvvm_f32x4_to_e3m2x4_rs_satfinite :
673+ NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" ,
674+ SM<" 100a" , [SM_103a]>, PTX87>;
675+ def __nvvm_f32x4_to_e3m2x4_rs_relu_satfinite :
676+ NVPTXBuiltinSMAndPTX<" _Vector<4, char>(_Vector<4, float>, uint32_t)" ,
677+ SM<" 100a" , [SM_103a]>, PTX87>;
646678
647679def __nvvm_ff_to_e2m1x2_rn_satfinite : NVPTXBuiltinSMAndPTX<" short(float, float)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
648680def __nvvm_ff_to_e2m1x2_rn_relu_satfinite : NVPTXBuiltinSMAndPTX<" short(float, float)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
649681
650682def __nvvm_e2m1x2_to_f16x2_rn : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(short)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
651683def __nvvm_e2m1x2_to_f16x2_rn_relu : NVPTXBuiltinSMAndPTX<" _Vector<2, __fp16>(short)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
652684
653- def __nvvm_f32x4_to_e2m1x4_rs_satfinite : NVPTXBuiltinSMAndPTX<" short(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
654- def __nvvm_f32x4_to_e2m1x4_rs_relu_satfinite : NVPTXBuiltinSMAndPTX<" short(_Vector<4, float>, uint32_t)" , SM<" 100a" , [SM_103a]>, PTX87>;
685+ def __nvvm_f32x4_to_e2m1x4_rs_satfinite :
686+ NVPTXBuiltinSMAndPTX<" short(_Vector<4, float>, uint32_t)" ,
687+ SM<" 100a" , [SM_103a]>, PTX87>;
688+ def __nvvm_f32x4_to_e2m1x4_rs_relu_satfinite :
689+ NVPTXBuiltinSMAndPTX<" short(_Vector<4, float>, uint32_t)" ,
690+ SM<" 100a" , [SM_103a]>, PTX87>;
655691
656692def __nvvm_ff_to_ue8m0x2_rz : NVPTXBuiltinSMAndPTX<" short(float, float)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
657693def __nvvm_ff_to_ue8m0x2_rz_satfinite : NVPTXBuiltinSMAndPTX<" short(float, float)" , SM<" 100a" , [SM_101a, SM_120a]>, PTX86>;
0 commit comments