@@ -145,19 +145,23 @@ llvm.func @triton_gen.dpas(%c : vector<8xf32>, %a : vector<8xi16>, %b : vector<8
145
145
146
146
// -----
147
147
148
// Negative test: the result vector is wider than the verifier expects.
// The requested tile is 8-bit x 32 wide x 8 high x 1 block = 2048 bits, and the
// diagnostic below reports an expected result size of 128 bits, whereas
// vector<16xi16> is 256 bits.
// NOTE(review): 128 = 2048 / 16, so the expected size presumably derives from
// the module's "ttg.threads-per-warp" = 16 attribute -- confirm against the
// op verifier.
module attributes {"ttg.threads-per-warp" = 16 : i32} {
  llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height : i32, %base_pitch : i32, %x : i32, %y : i32) {
    // expected-error @+1 {{'triton_gen.2Dblockload' op result size of 256 bits does not match the expected size of 128 bits}}
    %0 = triton_gen.2Dblockload %ptr, %base_width, %base_height, %base_pitch, %x, %y {elem_size_in_bits=8, tile_width=32, tile_height=8, v_blocks=1, transpose=false, vnni_transform=false, cache_control=Default} : (!llvm.ptr, i32, i32, i32, i32, i32) -> vector<16xi16>
    llvm.return
  }
}
153
155
154
156
// -----
155
157
158
// Negative test: both transpose and vnni_transform are set to true on the same
// load; the diagnostic below states that the two are mutually exclusive.
module attributes {"ttg.threads-per-warp" = 16 : i32} {
  llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height : i32, %base_pitch : i32, %x : i32, %y : i32) {
    // expected-error @+1 {{'triton_gen.2Dblockload' op transpose and vnni_transform are mutually exclusive}}
    %0 = triton_gen.2Dblockload %ptr, %base_width, %base_height, %base_pitch, %x, %y {elem_size_in_bits=8, tile_width=16, tile_height=8, v_blocks=1, transpose=true, vnni_transform=true, cache_control=Default} : (!llvm.ptr, i32, i32, i32, i32, i32) -> vector<2xi32>
    llvm.return
  }
}
161
165
162
166
// -----
163
167
@@ -177,19 +181,23 @@ llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height
177
181
178
182
// -----
179
183
184
// Negative test: transpose=true is requested with elem_size_in_bits=8; the
// diagnostic below states that transpose is only supported for 32 and 64 bit
// elements.
module attributes {"ttg.threads-per-warp" = 16 : i32} {
  llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height : i32, %base_pitch : i32, %x : i32, %y : i32) {
    // expected-error @+1 {{'triton_gen.2Dblockload' op transpose is only supported for 32 and 64 bit elements}}
    %0 = triton_gen.2Dblockload %ptr, %base_width, %base_height, %base_pitch, %x, %y {elem_size_in_bits=8, tile_width=32, tile_height=8, v_blocks=1, transpose=true, vnni_transform=false, cache_control=Default} : (!llvm.ptr, i32, i32, i32, i32, i32) -> vector<8xi16>
    llvm.return
  }
}
185
191
186
192
// -----
187
193
194
// Negative test: vnni_transform=true is requested with elem_size_in_bits=32;
// the diagnostic below states that vnni_transform is only supported for 8 and
// 16 bit elements.
module attributes {"ttg.threads-per-warp" = 16 : i32} {
  llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height : i32, %base_pitch : i32, %x : i32, %y : i32) {
    // expected-error @+1 {{'triton_gen.2Dblockload' op vnni_transform is only supported for 8 and 16 bit elements}}
    %0 = triton_gen.2Dblockload %ptr, %base_width, %base_height, %base_pitch, %x, %y {elem_size_in_bits=32, tile_width=8, tile_height=8, v_blocks=1, transpose=false, vnni_transform=true, cache_control=Default} : (!llvm.ptr, i32, i32, i32, i32, i32) -> vector<4xi32>
    llvm.return
  }
}
193
201
194
202
// -----
195
203
@@ -316,11 +324,13 @@ llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height
316
324
317
325
// -----
318
326
327
// Negative test: elem_size_in_bits=32 with neither transpose nor vnni_transform
// set, but the result vector has 16-bit elements (vector<8xi16>); the
// diagnostic below requires the result element type to be 32 bits.
module attributes {"ttg.threads-per-warp" = 16 : i32} {
  llvm.func @matrix_2Dblockload(%ptr : !llvm.ptr, %base_width : i32, %base_height : i32, %base_pitch : i32, %x : i32, %y : i32) {
    // expected-error @+1 {{'triton_gen.2Dblockload' op expecting result element type to be 32 bits}}
    %0 = triton_gen.2Dblockload %ptr, %base_width, %base_height, %base_pitch, %x, %y {elem_size_in_bits=32, tile_width=8, tile_height=8, v_blocks=1, transpose=false, vnni_transform=false, cache_control=Default} : (!llvm.ptr, i32, i32, i32, i32, i32) -> vector<8xi16>
    llvm.return
  }
}
324
334
325
335
// -----
326
336
0 commit comments