@@ -145,19 +145,23 @@ llvm.func @triton_gen.dpas(%c : vector<8xf32>, %a : vector<8xi16>, %b : vector<8
145145
146146// -----
147147
// Negative test: result vector size does not match what the op requires.
// The load below uses elem_size_in_bits=8, tile_width=32, tile_height=8 and
// v_blocks=1, and declares a 16 x i16 result (256 bits); the diagnostic
// annotation inside the function pins the error reporting that 128 bits were
// expected. The enclosing module sets threads-per-warp to 16.
// NOTE(review): presumably 128 = 32*8 elements * 8 bits / 16 threads-per-warp
// -- confirm against the op verifier.
// NOTE(review): the attribute key below appears with a leading space inside
// the quotes; this looks like an extraction artifact -- confirm the real file
// spells it without the space.
148+ module attributes {" ttg.threads-per-warp" = 16 : i32 } {
148149llvm.func @matrix_2Dblockload (%ptr : !llvm.ptr , %base_width : i32 , %base_height : i32 , %base_pitch : i32 , %x : i32 , %y : i32 ) {
149150 // expected-error @+1 {{'triton_gen.2Dblockload' op result size of 256 bits does not match the expected size of 128 bits}}
150151 %0 = triton_gen.2Dblockload %ptr , %base_width , %base_height , %base_pitch , %x , %y {elem_size_in_bits =8 , tile_width =32 , tile_height =8 , v_blocks =1 , transpose =false , vnni_transform =false , cache_control =Default } : (!llvm.ptr , i32 , i32 , i32 , i32 , i32 ) -> vector <16 xi16 >
151152 llvm.return
152153}
154+ }
153155
154156// -----
155157
// Negative test: transpose and vnni_transform requested together.
// The load below sets both transpose=true and vnni_transform=true; the
// diagnostic annotation inside the function pins the error stating that the
// two flags are mutually exclusive. The enclosing module sets
// threads-per-warp to 16.
// NOTE(review): the attribute key below appears with a leading space inside
// the quotes; this looks like an extraction artifact -- confirm the real file
// spells it without the space.
158+ module attributes {" ttg.threads-per-warp" = 16 : i32 } {
156159llvm.func @matrix_2Dblockload (%ptr : !llvm.ptr , %base_width : i32 , %base_height : i32 , %base_pitch : i32 , %x : i32 , %y : i32 ) {
157160 // expected-error @+1 {{'triton_gen.2Dblockload' op transpose and vnni_transform are mutually exclusive}}
158161 %0 = triton_gen.2Dblockload %ptr , %base_width , %base_height , %base_pitch , %x , %y {elem_size_in_bits =8 , tile_width =16 , tile_height =8 , v_blocks =1 , transpose =true , vnni_transform =true , cache_control =Default } : (!llvm.ptr , i32 , i32 , i32 , i32 , i32 ) -> vector <2 xi32 >
159162 llvm.return
160163}
164+ }
161165
162166// -----
163167
@@ -177,19 +181,23 @@ llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height
177181
178182// -----
179183
// Negative test: transpose requested for an unsupported element size.
// The load below sets transpose=true with elem_size_in_bits=8; the diagnostic
// annotation inside the function pins the error stating that transpose is
// only supported for 32 and 64 bit elements. The enclosing module sets
// threads-per-warp to 16.
// NOTE(review): the attribute key below appears with a leading space inside
// the quotes; this looks like an extraction artifact -- confirm the real file
// spells it without the space.
184+ module attributes {" ttg.threads-per-warp" = 16 : i32 } {
180185llvm.func @matrix_2Dblockload (%ptr : !llvm.ptr , %base_width : i32 , %base_height : i32 , %base_pitch : i32 , %x : i32 , %y : i32 ) {
181186 // expected-error @+1 {{'triton_gen.2Dblockload' op transpose is only supported for 32 and 64 bit elements}}
182187 %0 = triton_gen.2Dblockload %ptr , %base_width , %base_height , %base_pitch , %x , %y {elem_size_in_bits =8 , tile_width =32 , tile_height =8 , v_blocks =1 , transpose =true , vnni_transform =false , cache_control =Default } : (!llvm.ptr , i32 , i32 , i32 , i32 , i32 ) -> vector <8 xi16 >
183188 llvm.return
184189}
190+ }
185191
186192// -----
187193
// Negative test: vnni_transform requested for an unsupported element size.
// The load below sets vnni_transform=true with elem_size_in_bits=32; the
// diagnostic annotation inside the function pins the error stating that
// vnni_transform is only supported for 8 and 16 bit elements. The enclosing
// module sets threads-per-warp to 16.
// NOTE(review): the attribute key below appears with a leading space inside
// the quotes; this looks like an extraction artifact -- confirm the real file
// spells it without the space.
194+ module attributes {" ttg.threads-per-warp" = 16 : i32 } {
188195llvm.func @matrix_2Dblockload (%ptr : !llvm.ptr , %base_width : i32 , %base_height : i32 , %base_pitch : i32 , %x : i32 , %y : i32 ) {
189196 // expected-error @+1 {{'triton_gen.2Dblockload' op vnni_transform is only supported for 8 and 16 bit elements}}
190197 %0 = triton_gen.2Dblockload %ptr , %base_width , %base_height , %base_pitch , %x , %y {elem_size_in_bits =32 , tile_width =8 , tile_height =8 , v_blocks =1 , transpose =false , vnni_transform =true , cache_control =Default } : (!llvm.ptr , i32 , i32 , i32 , i32 , i32 ) -> vector <4 xi32 >
191198 llvm.return
192199}
200+ }
193201
194202// -----
195203
@@ -316,11 +324,13 @@ llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height
316324
317325// -----
318326
// Negative test: result element type does not match the required width.
// The load below sets elem_size_in_bits=32 with transpose=false and
// vnni_transform=false, but declares a result of i16 elements; the diagnostic
// annotation inside the function pins the error stating that the result
// element type is expected to be 32 bits. The enclosing module sets
// threads-per-warp to 16.
// NOTE(review): the attribute key below appears with a leading space inside
// the quotes; this looks like an extraction artifact -- confirm the real file
// spells it without the space.
327+ module attributes {" ttg.threads-per-warp" = 16 : i32 } {
319328llvm.func @matrix_2Dblockload (%ptr : !llvm.ptr , %base_width : i32 , %base_height : i32 , %base_pitch : i32 , %x : i32 , %y : i32 ) {
320329 // expected-error @+1 {{'triton_gen.2Dblockload' op expecting result element type to be 32 bits}}
321330 %0 = triton_gen.2Dblockload %ptr , %base_width , %base_height , %base_pitch , %x , %y {elem_size_in_bits =32 , tile_width =8 , tile_height =8 , v_blocks =1 , transpose =false , vnni_transform =false , cache_control =Default } : (!llvm.ptr , i32 , i32 , i32 , i32 , i32 ) -> vector <8 xi16 >
322331 llvm.return
323332}
333+ }
324334
325335// -----
326336
0 commit comments