@@ -317,13 +317,13 @@ module attributes {gpu.container_module} {
317317 }
318318 }
319319}
320- // CHECK-SAME: (%[[VAL_0:.*]]: memref<?x?xf32>) kernel {
321- // CHECK: %[[VAL_1:.*]] = arith.constant 1 : index
322- // CHECK: %[[VAL_2:.*]] = memref.dim %[[VAL_0]], %[[VAL_1]] : memref<?x?xf32>
323- // CHECK: %[[VAL_3:.*]] = arith.constant 0 : index
324- // CHECK: affine.for %[[VAL_4:.*]] = %[[VAL_3]] to %[[VAL_2]] step 32 {
325- // CHECK: }
326- // CHECK: gpu.return
320+ // CHECK-SAME: (%[[VAL_0:.*]]: memref<?x?xf32>) kernel {
321+ // CHECK: %[[VAL_1:.*]] = arith.constant 1 : index
322+ // CHECK: %[[VAL_2:.*]] = memref.dim %[[VAL_0]], %[[VAL_1]] : memref<?x?xf32>
323+ // CHECK: %[[VAL_3:.*]] = arith.constant 0 : index
324+ // CHECK: affine.for %{{.*}} = %[[VAL_3]] to %[[VAL_2]] step 32 {
325+ // CHECK: }
326+ // CHECK: gpu.return
327327
328328// -----
329329
@@ -344,15 +344,15 @@ module {
344344 }
345345}
346346
347- // CHECK-NEXT: %[[VAL_0:.*]] = arith.constant 1 : index
348- // CHECK-NEXT: gpu.launch blocks(%[[VAL_1:.*]], %[[VAL_2:.*]], %[[VAL_3:.*]]) in (%[[VAL_4:.*]] = %[[VAL_0]], %[[VAL_5:.*]] = %[[VAL_0]], %[[VAL_6:.*]] = %[[VAL_0]]) threads(%[[VAL_7:.*]], %[[VAL_8:.*]], %[[VAL_9:.*]]) in (%[[VAL_10:.*]] = %[[VAL_0]], %[[VAL_11:.*]] = %[[VAL_0]], %[[VAL_12:.*]] = %[[VAL_0]]) {
349- // CHECK-NEXT: %[[VAL_13:.*]] = gpu.thread_id x
350- // CHECK-NEXT: %[[VAL_14:.*]] = arith.constant 128 : index
351- // CHECK-NEXT: affine.for %[[VAL_15:.*]] = %[[VAL_13]] to %[[VAL_14]] step 8 {
352- // CHECK-NEXT: }
353- // CHECK-NEXT: gpu.terminator
347+ // CHECK-NEXT: %[[VAL_0:.*]] = arith.constant 1 : index
348+ // CHECK-NEXT: gpu.launch blocks(%[[VAL_1:.*]], %[[VAL_2:.*]], %[[VAL_3:.*]]) in (%[[VAL_4:.*]] = %[[VAL_0]], %[[VAL_5:.*]] = %[[VAL_0]], %[[VAL_6:.*]] = %[[VAL_0]]) threads(%[[VAL_7:.*]], %[[VAL_8:.*]], %[[VAL_9:.*]]) in (%[[VAL_10:.*]] = %[[VAL_0]], %[[VAL_11:.*]] = %[[VAL_0]], %[[VAL_12:.*]] = %[[VAL_0]]) {
349+ // CHECK-NEXT: %[[VAL_13:.*]] = gpu.thread_id x
350+ // CHECK-NEXT: %[[VAL_14:.*]] = arith.constant 128 : index
351+ // CHECK-NEXT: affine.for %{{.*}} = %[[VAL_13]] to %[[VAL_14]] step 8 {
354352// CHECK-NEXT: }
355- // CHECK-NEXT: return
353+ // CHECK-NEXT: gpu.terminator
354+ // CHECK-NEXT: }
355+ // CHECK-NEXT: return
356356
357357// -----
358358
0 commit comments