@@ -14,9 +14,9 @@ func.func @test_stick_expansion_with_sat(%arg0: memref<16x8x128xf32>) -> memref<
14
14
// CHECK-DAG: [[MAP_1_:#.+]] = affine_map<()[s0] -> (s0 * 64)>
15
15
// CHECK-DAG: [[MAP_2_:#.+]] = affine_map<()[s0, s1] -> (s1 floordiv 64)>
16
16
// CHECK-DAG: [[MAP_3_:#.+]] = affine_map<()[s0, s1] -> (s0 + s1)>
17
- // CHECK-DAG: [[MAP_4_:#.+]] = affine_map<()[s0, s1] -> (s1 + 8)>
18
- // CHECK-DAG: [[MAP_5_:#.+]] = affine_map<()[s0, s1] -> (s1 + 16)>
19
- // CHECK-DAG: [[MAP_6_:#.+]] = affine_map<()[s0, s1] -> (s1 + 24)>
17
+ // CHECK-DAG: [[MAP_4_:#.+]] = affine_map<()[s0, s1] -> (s0 + 8)>
18
+ // CHECK-DAG: [[MAP_5_:#.+]] = affine_map<()[s0, s1] -> (s0 + 16)>
19
+ // CHECK-DAG: [[MAP_6_:#.+]] = affine_map<()[s0, s1] -> (s0 + 24)>
20
20
// CHECK-LABEL: func.func @test_stick_expansion_with_sat
21
21
// CHECK-SAME: ([[PARAM_0_:%.+]]: memref<16x8x128xf32>) -> memref<16x8x128xf16, #map> {
22
22
// CHECK-DAG: [[CST_28_:%.+]] = arith.constant 28 : index
@@ -40,7 +40,7 @@ func.func @test_stick_expansion_with_sat(%arg0: memref<16x8x128xf32>) -> memref<
40
40
// CHECK: krnl.prefetch [[PARAM_0_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_2_]]{{.}}, read, locality<1>, data : memref<16x8x128xf32>
41
41
// CHECK: krnl.prefetch [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_2_]]{{.}}, write, locality<1>, data : memref<16x8x128xf16, #map>
42
42
// CHECK: affine.for [[I_3_:%.+]] = 0 to 64 step 32 {
43
- // CHECK: [[VAR_5_:%.+]] = affine.apply [[MAP_3_]](){{.}}[[VAR_2_ ]], [[I_3_ ]]{{.}}
43
+ // CHECK: [[VAR_5_:%.+]] = affine.apply [[MAP_3_]](){{.}}[[I_3_ ]], [[VAR_2_ ]]{{.}}
44
44
// CHECK-DAG: [[LOAD_PARAM_0_MEM_:%.+]] = vector.load [[PARAM_0_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_5_]]{{.}} : memref<16x8x128xf32>, vector<4xf32>
45
45
// CHECK-DAG: [[VAR_7_:%.+]] = arith.addi [[VAR_5_]], [[CST_4_]] : index
46
46
// CHECK-NOT: separator of consecutive DAGs
@@ -86,11 +86,11 @@ func.func @test_stick_expansion_with_sat(%arg0: memref<16x8x128xf32>) -> memref<
86
86
// CHECK-DAG: [[VAR_39_:%.+]] = "zlow.vec_f32_to_dlf16"([[VAR_33_]], [[VAR_34_]]) : (vector<4xf32>, vector<4xf32>) -> vector<8xf16>
87
87
// CHECK: [[VAR_40_:%.+]] = "zlow.vec_f32_to_dlf16"([[VAR_35_]], [[VAR_36_]]) : (vector<4xf32>, vector<4xf32>) -> vector<8xf16>
88
88
// CHECK: vector.store [[VAR_37_]], [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[I_3_]]{{.}} : memref<2x64xf16>, vector<8xf16>
89
- // CHECK: [[VAR_41_:%.+]] = affine.apply [[MAP_4_]](){{.}}[[VAR_2_ ]], [[I_3_ ]]{{.}}
89
+ // CHECK: [[VAR_41_:%.+]] = affine.apply [[MAP_4_]](){{.}}[[I_3_ ]], [[VAR_2_ ]]{{.}}
90
90
// CHECK: vector.store [[VAR_38_]], [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[VAR_4_]]1] : memref<2x64xf16>, vector<8xf16>
91
- // CHECK: [[VAR_42_:%.+]] = affine.apply [[MAP_5_]](){{.}}[[VAR_2_ ]], [[I_3_ ]]{{.}}
91
+ // CHECK: [[VAR_42_:%.+]] = affine.apply [[MAP_5_]](){{.}}[[I_3_ ]], [[VAR_2_ ]]{{.}}
92
92
// CHECK: vector.store [[VAR_39_]], [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[VAR_4_]]2] : memref<2x64xf16>, vector<8xf16>
93
- // CHECK: [[VAR_43_:%.+]] = affine.apply [[MAP_6_]](){{.}}[[VAR_2_ ]], [[I_3_ ]]{{.}}
93
+ // CHECK: [[VAR_43_:%.+]] = affine.apply [[MAP_6_]](){{.}}[[I_3_ ]], [[VAR_2_ ]]{{.}}
94
94
// CHECK: vector.store [[VAR_40_]], [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[VAR_4_]]3] : memref<2x64xf16>, vector<8xf16>
95
95
// CHECK: }
96
96
// CHECK: }
@@ -112,9 +112,9 @@ func.func @test_stick_expansion_without_sat(%arg0: memref<16x8x128xf32>) -> memr
112
112
// CHECK-DAG: [[MAP_1_:#.+]] = affine_map<()[s0] -> (s0 * 64)>
113
113
// CHECK-DAG: [[MAP_2_:#.+]] = affine_map<()[s0, s1] -> (s1 floordiv 64)>
114
114
// CHECK-DAG: [[MAP_3_:#.+]] = affine_map<()[s0, s1] -> (s0 + s1)>
115
- // CHECK-DAG: [[MAP_4_:#.+]] = affine_map<()[s0, s1] -> (s1 + 8)>
116
- // CHECK-DAG: [[MAP_5_:#.+]] = affine_map<()[s0, s1] -> (s1 + 16)>
117
- // CHECK-DAG: [[MAP_6_:#.+]] = affine_map<()[s0, s1] -> (s1 + 24)>
115
+ // CHECK-DAG: [[MAP_4_:#.+]] = affine_map<()[s0, s1] -> (s0 + 8)>
116
+ // CHECK-DAG: [[MAP_5_:#.+]] = affine_map<()[s0, s1] -> (s0 + 16)>
117
+ // CHECK-DAG: [[MAP_6_:#.+]] = affine_map<()[s0, s1] -> (s0 + 24)>
118
118
// CHECK-LABEL: func.func @test_stick_expansion_without_sat
119
119
// CHECK-SAME: ([[PARAM_0_:%.+]]: memref<16x8x128xf32>) -> memref<16x8x128xf16, #map> {
120
120
// CHECK-DAG: [[CST_28_:%.+]] = arith.constant 28 : index
@@ -136,7 +136,7 @@ func.func @test_stick_expansion_without_sat(%arg0: memref<16x8x128xf32>) -> memr
136
136
// CHECK: krnl.prefetch [[PARAM_0_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_2_]]{{.}}, read, locality<1>, data : memref<16x8x128xf32>
137
137
// CHECK: krnl.prefetch [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_2_]]{{.}}, write, locality<1>, data : memref<16x8x128xf16, #map>
138
138
// CHECK: affine.for [[I_3_:%.+]] = 0 to 64 step 32 {
139
- // CHECK: [[VAR_5_:%.+]] = affine.apply [[MAP_3_]](){{.}}[[VAR_2_ ]], [[I_3_ ]]{{.}}
139
+ // CHECK: [[VAR_5_:%.+]] = affine.apply [[MAP_3_]](){{.}}[[I_3_ ]], [[VAR_2_ ]]{{.}}
140
140
// CHECK-DAG: [[LOAD_PARAM_0_MEM_:%.+]] = vector.load [[PARAM_0_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_5_]]{{.}} : memref<16x8x128xf32>, vector<4xf32>
141
141
// CHECK-DAG: [[VAR_7_:%.+]] = arith.addi [[VAR_5_]], [[CST_4_]] : index
142
142
// CHECK-NOT: separator of consecutive DAGs
@@ -164,11 +164,11 @@ func.func @test_stick_expansion_without_sat(%arg0: memref<16x8x128xf32>) -> memr
164
164
// CHECK-DAG: [[VAR_23_:%.+]] = "zlow.vec_f32_to_dlf16"([[LOAD_PARAM_0_MEM_4_]], [[LOAD_PARAM_0_MEM_5_]]) : (vector<4xf32>, vector<4xf32>) -> vector<8xf16>
165
165
// CHECK: [[VAR_24_:%.+]] = "zlow.vec_f32_to_dlf16"([[LOAD_PARAM_0_MEM_6_]], [[LOAD_PARAM_0_MEM_7_]]) : (vector<4xf32>, vector<4xf32>) -> vector<8xf16>
166
166
// CHECK: vector.store [[VAR_21_]], [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[I_3_]]{{.}} : memref<2x64xf16>, vector<8xf16>
167
- // CHECK: [[VAR_25_:%.+]] = affine.apply [[MAP_4_]](){{.}}[[VAR_2_ ]], [[I_3_ ]]{{.}}
167
+ // CHECK: [[VAR_25_:%.+]] = affine.apply [[MAP_4_]](){{.}}[[I_3_ ]], [[VAR_2_ ]]{{.}}
168
168
// CHECK: vector.store [[VAR_22_]], [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[VAR_25_]]{{.}} : memref<2x64xf16>, vector<8xf16>
169
- // CHECK: [[VAR_26_:%.+]] = affine.apply [[MAP_5_]](){{.}}[[VAR_2_ ]], [[I_3_ ]]{{.}}
169
+ // CHECK: [[VAR_26_:%.+]] = affine.apply [[MAP_5_]](){{.}}[[I_3_ ]], [[VAR_2_ ]]{{.}}
170
170
// CHECK: vector.store [[VAR_23_]], [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[VAR_26_]]{{.}} : memref<2x64xf16>, vector<8xf16>
171
- // CHECK: [[VAR_27_:%.+]] = affine.apply [[MAP_6_]](){{.}}[[VAR_2_ ]], [[I_3_ ]]{{.}}
171
+ // CHECK: [[VAR_27_:%.+]] = affine.apply [[MAP_6_]](){{.}}[[I_3_ ]], [[VAR_2_ ]]{{.}}
172
172
// CHECK: vector.store [[VAR_24_]], [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[VAR_27_]]{{.}} : memref<2x64xf16>, vector<8xf16>
173
173
// CHECK: }
174
174
// CHECK: }
@@ -196,7 +196,7 @@ func.func @test_unstick_expansion(%arg0: memref<16x8x128xf16, #map>) -> memref<1
196
196
// CHECK-DAG: [[MAP_7_:#.+]] = affine_map<()[s0] -> (-s0 + 121)>
197
197
// CHECK-DAG: [[MAP_8_:#.+]] = affine_map<()[s0] -> ((-s0) mod 8)>
198
198
// CHECK-DAG: [[MAP_9_:#.+]] = affine_map<()[s0] -> (-s0 - (-s0) mod 8 + 128)>
199
- // CHECK-DAG: [[MAP_10_:#.+]] = affine_map<(d0)[s0, s1] -> (d0 + s0 + s1 )>
199
+ // CHECK-DAG: [[MAP_10_:#.+]] = affine_map<(d0)[s0, s1] -> (d0 + s1 + s0 )>
200
200
// CHECK-LABEL: func.func @test_unstick_expansion
201
201
// CHECK-SAME: ([[PARAM_0_:%.+]]: memref<16x8x128xf16, #map>) -> memref<16x8x128xf32> {
202
202
// CHECK-DAG: [[CST_1_:%.+]] = arith.constant 1 : index
@@ -232,52 +232,51 @@ func.func @test_unstick_expansion(%arg0: memref<16x8x128xf16, #map>) -> memref<1
232
232
// CHECK-DAG: [[LOAD_VAR_reinterpret_cast_MEM_2_:%.+]] = vector.load [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[VAR_8_]]{{.}} : memref<2x64xf16>, vector<8xf16>
233
233
// CHECK-DAG: [[VAR_10_:%.+]] = affine.apply [[MAP_5_]]([[I_3_]])
234
234
// CHECK: [[LOAD_VAR_reinterpret_cast_MEM_3_:%.+]] = vector.load [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[VAR_10_]]{{.}} : memref<2x64xf16>, vector<8xf16>
235
- // CHECK: [[output1_ :%.+]], [[VAR_output2_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
236
- // CHECK: [[output1_0_ :%.+]], [[VAR_output2_1_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_1_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
237
- // CHECK: [[output1_2_ :%.+]], [[VAR_output2_3_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_2_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
238
- // CHECK: [[output1_4_ :%.+]], [[VAR_output2_5_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_3_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
235
+ // CHECK: [[VAR_output1_ :%.+]], [[VAR_output2_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
236
+ // CHECK: [[VAR_output1_0_ :%.+]], [[VAR_output2_1_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_1_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
237
+ // CHECK: [[VAR_output1_2_ :%.+]], [[VAR_output2_3_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_2_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
238
+ // CHECK: [[VAR_output1_4_ :%.+]], [[VAR_output2_5_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_3_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
239
239
// CHECK: [[VAR_12_:%.+]] = affine.apply [[MAP_6_]]([[I_3_]]){{.}}[[VAR_2_]]{{.}}
240
- // CHECK: vector.store [[output1_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]2] : memref<16x8x128xf32>, vector<4xf32>
240
+ // CHECK: vector.store [[VAR_output1_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]2] : memref<16x8x128xf32>, vector<4xf32>
241
241
// CHECK: [[VAR_13_:%.+]] = arith.addi [[VAR_12_]], [[CST_4_]] : index
242
242
// CHECK: vector.store [[VAR_output2_]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]3] : memref<16x8x128xf32>, vector<4xf32>
243
243
// CHECK: [[VAR_14_:%.+]] = arith.addi [[VAR_12_]], [[CST_8_]] : index
244
- // CHECK: vector.store [[output1_0_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]4] : memref<16x8x128xf32>, vector<4xf32>
244
+ // CHECK: vector.store [[VAR_output1_0_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]4] : memref<16x8x128xf32>, vector<4xf32>
245
245
// CHECK: [[VAR_15_:%.+]] = arith.addi [[VAR_12_]], [[CST_12_]] : index
246
246
// CHECK: vector.store [[VAR_output2_1_]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]5] : memref<16x8x128xf32>, vector<4xf32>
247
247
// CHECK: [[VAR_16_:%.+]] = arith.addi [[VAR_12_]], [[CST_16_]] : index
248
- // CHECK: vector.store [[output1_2_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]6] : memref<16x8x128xf32>, vector<4xf32>
248
+ // CHECK: vector.store [[VAR_output1_2_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]6] : memref<16x8x128xf32>, vector<4xf32>
249
249
// CHECK: [[VAR_17_:%.+]] = arith.addi [[VAR_12_]], [[CST_20_]] : index
250
250
// CHECK: vector.store [[VAR_output2_3_]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]7] : memref<16x8x128xf32>, vector<4xf32>
251
251
// CHECK: [[VAR_18_:%.+]] = arith.addi [[VAR_12_]], [[CST_24_]] : index
252
- // CHECK: vector.store [[output1_4_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]8] : memref<16x8x128xf32>, vector<4xf32>
252
+ // CHECK: vector.store [[VAR_output1_4_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]8] : memref<16x8x128xf32>, vector<4xf32>
253
253
// CHECK: [[VAR_19_:%.+]] = arith.addi [[VAR_12_]], [[CST_28_]] : index
254
254
// CHECK: vector.store [[VAR_output2_5_]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]9] : memref<16x8x128xf32>, vector<4xf32>
255
255
// CHECK: }
256
256
// CHECK: } else {
257
257
// CHECK: [[LOAD_VAR_reinterpret_cast_MEM_4_:%.+]] = affine.apply [[MAP_7_]](){{.}}[[VAR_2_]]{{.}}
258
258
// CHECK: scf.for [[I_4_:%.+]] = [[CST_0_]] to [[LOAD_VAR_reinterpret_cast_MEM_4_]] step [[CST_8_]] {
259
259
// CHECK: [[LOAD_VAR_reinterpret_cast_MEM_5_:%.+]] = vector.load [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[I_4_]]{{.}} : memref<2x64xf16>, vector<8xf16>
260
- // CHECK: [[output1_0_ ]], [[VAR_output2_1_1_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_5_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
260
+ // CHECK: [[VAR_output1_0_1_:%.+ ]], [[VAR_output2_1_1_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_5_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
261
261
// CHECK: [[VAR_10_1_:%.+]] = affine.apply [[MAP_6_]]([[I_4_]]){{.}}[[VAR_2_]]{{.}}
262
- // CHECK: vector.store [[output1_0_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]0] : memref<16x8x128xf32>, vector<4xf32>
262
+ // CHECK: vector.store [[VAR_output1_0_1_ ]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]0] : memref<16x8x128xf32>, vector<4xf32>
263
263
// CHECK: [[LOAD_VAR_reinterpret_cast_MEM_3_:%.+]] = arith.addi [[VAR_10_1_]], [[CST_4_]] : index
264
264
// CHECK: vector.store [[VAR_output2_1_1_]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]1] : memref<16x8x128xf32>, vector<4xf32>
265
265
// CHECK: }
266
266
// CHECK-DAG: [[VAR_6_1_:%.+]] = affine.apply [[MAP_8_]](){{.}}[[VAR_2_]]{{.}}
267
267
// CHECK-DAG: [[LOAD_VAR_reinterpret_cast_MEM_1_:%.+]] = affine.apply [[MAP_9_]](){{.}}[[VAR_2_]]{{.}}
268
268
// CHECK: [[LOAD_VAR_reinterpret_cast_MEM_6_:%.+]] = vector.load [[VAR_reinterpret_cast_]]{{.}}[[VAR_4_]], [[LOAD_VAR_reinterpret_cast_MEM_1_]]{{.}} : memref<2x64xf16>, vector<8xf16>
269
- // CHECK: [[output1_ ]], [[VAR_output2_1_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_6_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
269
+ // CHECK: [[VAR_output1_1_:%.+ ]], [[VAR_output2_1_:%.+]] = "zlow.vec_dlf16_to_f32"([[LOAD_VAR_reinterpret_cast_MEM_6_]]) : (vector<8xf16>) -> (vector<4xf32>, vector<4xf32>)
270
270
// CHECK: [[RES_1_:%.+]] = memref.alloca() {{.*}}: memref<8xf32>
271
- // CHECK: vector.store [[output1_ ]], [[RES_1_]]{{.}}[[CST_0_]]{{.}} : memref<8xf32>, vector<4xf32>
271
+ // CHECK: vector.store [[VAR_output1_1_ ]], [[RES_1_]]{{.}}[[CST_0_]]{{.}} : memref<8xf32>, vector<4xf32>
272
272
// CHECK: vector.store [[VAR_output2_1_]], [[RES_1_]]{{.}}[[CST_4_]]{{.}} : memref<8xf32>, vector<4xf32>
273
273
// CHECK: scf.for [[I_5_:%.+]] = [[CST_0_]] to [[VAR_6_1_]] step [[CST_1_]] {
274
274
// CHECK-DAG: [[LOAD_VAR_reinterpret_cast_MEM_5_:%.+]] = krnl.load [[RES_1_]]{{.}}[[I_5_]]{{.}} : memref<8xf32>
275
- // CHECK-DAG: [[VAR_10_2_:%.+]] = affine.apply [[MAP_10_]]([[I_5_]]){{.}}[[VAR_2_ ]], [[LOAD_VAR_reinterpret_cast_MEM_1_ ]]{{.}}
275
+ // CHECK-DAG: [[VAR_10_2_:%.+]] = affine.apply [[MAP_10_]]([[I_5_]]){{.}}[[LOAD_VAR_reinterpret_cast_MEM_1_ ]], [[VAR_2_ ]]{{.}}
276
276
// CHECK: krnl.store [[LOAD_VAR_reinterpret_cast_MEM_5_]], [[RES_]]{{.}}[[VAR_1_]]#0, [[VAR_1_]]#1, [[VAR_1_]]0] : memref<16x8x128xf32>
277
277
// CHECK: }
278
278
// CHECK: }
279
279
// CHECK: }
280
280
// CHECK: return [[RES_]] : memref<16x8x128xf32>
281
281
// CHECK: }
282
- }
283
-
282
+ }
0 commit comments