@@ -28,7 +28,7 @@ module attributes {"ttg.num-ctas" = 1 : i32, "ttg.num-warps" = 1 : i32} {
28
28
%4 = arith.addi %3 , %2 : tensor <128 xi32 , #blocked0 >
29
29
%5 = tt.splat %N: i32 -> tensor <128 xi32 , #blocked0 >
30
30
%7 = arith.cmpi slt , %4 , %5: tensor <128 xi32 , #blocked0 >
31
- // CHECK: %[[mask:.*]] = llvm.extractvalue %{{.*}} : !llvm.struct<(i1, i1, i1, i1)>
31
+ // CHECK: %[[mask:.*]] = llvm.icmp "slt"
32
32
// CHECK: %[[offset:.*]] = llvm.select %[[mask]]
33
33
// CHECK: rocdl.raw.ptr.buffer.load {{.*}}, %[[offset]]
34
34
%ret = amdgpu.buffer_load %arg0 [%offset ], %7 stride = %c256_i32 : tensor <128 xf32 , #blocked0 >
@@ -51,7 +51,7 @@ module attributes {"ttg.num-ctas" = 1 : i32, "ttg.num-warps" = 1 : i32} {
51
51
%5 = tt.splat %N: i32 -> tensor <128 xi32 , #blocked0 >
52
52
%7 = arith.cmpi slt , %4 , %5: tensor <128 xi32 , #blocked0 >
53
53
%other = arith.constant dense <0.00e+00 > : tensor <128 xf32 , #blocked0 >
54
- // CHECK: %[[mask:.*]] = llvm.extractvalue %{{.*}} : !llvm.struct<(i1, i1, i1, i1)>
54
+ // CHECK: %[[mask:.*]] = llvm.icmp "slt"
55
55
// CHECK: %[[offset:.*]] = llvm.select %[[mask]]
56
56
// CHECK: rocdl.raw.ptr.buffer.load {{.*}}, %[[offset]]
57
57
// CHECK: llvm.select
@@ -90,7 +90,7 @@ module attributes {"ttg.num-ctas" = 1 : i32, "ttg.num-warps" = 1 : i32} {
90
90
%4 = arith.addi %3 , %2 : tensor <128 xi32 , #blocked0 >
91
91
%5 = tt.splat %N: i32 -> tensor <128 xi32 , #blocked0 >
92
92
%7 = arith.cmpi slt , %4 , %5: tensor <128 xi32 , #blocked0 >
93
- // CHECK: %[[mask0:.*]] = llvm.extractvalue %{{.*}} : !llvm.struct<(i1, i1, i1, i1)>
93
+ // CHECK: %[[mask0:.*]] = llvm.icmp "slt"
94
94
// CHECK: %[[mask1:.*]] = llvm.mlir.constant(true) : i1
95
95
// CHECK: %[[mask2:.*]] = llvm.and %[[mask1]], %[[mask0]]
96
96
// CHECK: %[[offset:.*]] = llvm.select %[[mask2]]
@@ -216,7 +216,7 @@ module attributes {"ttg.num-ctas" = 1 : i32, "ttg.num-warps" = 1 : i32} {
216
216
%4 = arith.addi %3 , %2 : tensor <128 xi32 , #blocked0 >
217
217
%5 = tt.splat %N: i32 -> tensor <128 xi32 , #blocked0 >
218
218
%mask = arith.cmpi slt , %4 , %5: tensor <128 xi32 , #blocked0 >
219
- // CHECK: %[[mask0:.*]] = llvm.extractvalue %{{.*}} : !llvm.struct<(i1, i1, i1, i1)>
219
+ // CHECK: %[[mask0:.*]] = llvm.icmp "slt"
220
220
// There should be a single release fence before any atomics
221
221
// CHECK: llvm.fence syncscope("agent") release
222
222
// CHECK: %[[mask1:.*]] = llvm.mlir.constant(true) : i1
0 commit comments