@@ -142,27 +142,27 @@ define i32 @test(ptr %pix1, ptr %pix2, i64 %idx.ext, i64 %idx.ext63, ptr %add.pt
142
142
; CHECK-NEXT: [[TMP66:%.*]] = load <2 x i8>, ptr [[ARRAYIDX8]], align 1
143
143
; CHECK-NEXT: [[TMP102:%.*]] = zext <2 x i8> [[TMP66]] to <2 x i32>
144
144
; CHECK-NEXT: [[TMP67:%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[PIX2]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
145
- ; CHECK-NEXT: [[TMP78 :%.*]] = zext <2 x i8> [[TMP67]] to <2 x i32>
145
+ ; CHECK-NEXT: [[TMP77 :%.*]] = zext <2 x i8> [[TMP67]] to <2 x i32>
146
146
; CHECK-NEXT: [[TMP73:%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[TMP1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
147
- ; CHECK-NEXT: [[TMP81 :%.*]] = zext <2 x i8> [[TMP73]] to <2 x i32>
148
- ; CHECK-NEXT: [[TMP71 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX5]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
149
- ; CHECK-NEXT: [[TMP76:%.*]] = zext <2 x i8> [[TMP71 ]] to <2 x i32>
150
- ; CHECK-NEXT: [[TMP87:%.*]] = sub <2 x i32> [[TMP81 ]], [[TMP76]]
147
+ ; CHECK-NEXT: [[TMP78 :%.*]] = zext <2 x i8> [[TMP73]] to <2 x i32>
148
+ ; CHECK-NEXT: [[TMP85 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX5]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
149
+ ; CHECK-NEXT: [[TMP76:%.*]] = zext <2 x i8> [[TMP85 ]] to <2 x i32>
150
+ ; CHECK-NEXT: [[TMP87:%.*]] = sub <2 x i32> [[TMP78 ]], [[TMP76]]
151
151
; CHECK-NEXT: [[TMP88:%.*]] = shl <2 x i32> [[TMP87]], <i32 16, i32 16>
152
- ; CHECK-NEXT: [[TMP83 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX22]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
153
- ; CHECK-NEXT: [[TMP80:%.*]] = zext <2 x i8> [[TMP83 ]] to <2 x i32>
154
- ; CHECK-NEXT: [[TMP77 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX25]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
155
- ; CHECK-NEXT: [[TMP82:%.*]] = zext <2 x i8> [[TMP77 ]] to <2 x i32>
156
- ; CHECK-NEXT: [[TMP85 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX27]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
157
- ; CHECK-NEXT: [[TMP84:%.*]] = zext <2 x i8> [[TMP85 ]] to <2 x i32>
152
+ ; CHECK-NEXT: [[TMP89 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX22]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
153
+ ; CHECK-NEXT: [[TMP80:%.*]] = zext <2 x i8> [[TMP89 ]] to <2 x i32>
154
+ ; CHECK-NEXT: [[TMP81 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX25]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
155
+ ; CHECK-NEXT: [[TMP82:%.*]] = zext <2 x i8> [[TMP81 ]] to <2 x i32>
156
+ ; CHECK-NEXT: [[TMP83 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX27]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
157
+ ; CHECK-NEXT: [[TMP84:%.*]] = zext <2 x i8> [[TMP83 ]] to <2 x i32>
158
158
; CHECK-NEXT: [[TMP95:%.*]] = sub <2 x i32> [[TMP82]], [[TMP84]]
159
159
; CHECK-NEXT: [[TMP96:%.*]] = shl <2 x i32> [[TMP95]], <i32 16, i32 16>
160
160
; CHECK-NEXT: [[TMP97:%.*]] = insertelement <2 x i32> [[TMP102]], i32 [[CONV33]], i32 1
161
- ; CHECK-NEXT: [[TMP89 :%.*]] = sub <2 x i32> [[TMP97]], [[TMP80]]
162
- ; CHECK-NEXT: [[TMP105:%.*]] = add <2 x i32> [[TMP96]], [[TMP89 ]]
161
+ ; CHECK-NEXT: [[TMP90 :%.*]] = sub <2 x i32> [[TMP97]], [[TMP80]]
162
+ ; CHECK-NEXT: [[TMP105:%.*]] = add <2 x i32> [[TMP96]], [[TMP90 ]]
163
163
; CHECK-NEXT: [[TMP86:%.*]] = insertelement <2 x i32> [[TMP102]], i32 [[CONV1]], i32 0
164
- ; CHECK-NEXT: [[TMP99 :%.*]] = sub <2 x i32> [[TMP86]], [[TMP78 ]]
165
- ; CHECK-NEXT: [[TMP92:%.*]] = add <2 x i32> [[TMP88]], [[TMP99 ]]
164
+ ; CHECK-NEXT: [[TMP98 :%.*]] = sub <2 x i32> [[TMP86]], [[TMP77 ]]
165
+ ; CHECK-NEXT: [[TMP92:%.*]] = add <2 x i32> [[TMP88]], [[TMP98 ]]
166
166
; CHECK-NEXT: [[TMP93:%.*]] = shufflevector <2 x i32> [[TMP105]], <2 x i32> [[TMP92]], <2 x i32> <i32 0, i32 2>
167
167
; CHECK-NEXT: [[TMP106:%.*]] = add <2 x i32> [[TMP105]], [[TMP92]]
168
168
; CHECK-NEXT: [[TMP91:%.*]] = sub <2 x i32> [[TMP92]], [[TMP105]]
@@ -182,21 +182,21 @@ define i32 @test(ptr %pix1, ptr %pix2, i64 %idx.ext, i64 %idx.ext63, ptr %add.pt
182
182
; CHECK-NEXT: [[MUL_I61_4:%.*]] = mul i32 [[AND_I60_4]], 65535
183
183
; CHECK-NEXT: [[TMP104:%.*]] = load <2 x i8>, ptr [[ARRAYIDX8_1]], align 1
184
184
; CHECK-NEXT: [[TMP110:%.*]] = zext <2 x i8> [[TMP104]] to <2 x i32>
185
- ; CHECK-NEXT: [[TMP98 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ADD_PTR644]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
186
- ; CHECK-NEXT: [[TMP103:%.*]] = zext <2 x i8> [[TMP98 ]] to <2 x i32>
187
- ; CHECK-NEXT: [[TMP100 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX3_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
188
- ; CHECK-NEXT: [[TMP109 :%.*]] = zext <2 x i8> [[TMP100 ]] to <2 x i32>
189
- ; CHECK-NEXT: [[TMP112 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX5_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
190
- ; CHECK-NEXT: [[TMP114 :%.*]] = zext <2 x i8> [[TMP112 ]] to <2 x i32>
191
- ; CHECK-NEXT: [[TMP124:%.*]] = sub <2 x i32> [[TMP109 ]], [[TMP114 ]]
185
+ ; CHECK-NEXT: [[TMP109 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ADD_PTR644]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
186
+ ; CHECK-NEXT: [[TMP103:%.*]] = zext <2 x i8> [[TMP109 ]] to <2 x i32>
187
+ ; CHECK-NEXT: [[TMP116 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX3_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
188
+ ; CHECK-NEXT: [[TMP118 :%.*]] = zext <2 x i8> [[TMP116 ]] to <2 x i32>
189
+ ; CHECK-NEXT: [[TMP128 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX5_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
190
+ ; CHECK-NEXT: [[TMP155 :%.*]] = zext <2 x i8> [[TMP128 ]] to <2 x i32>
191
+ ; CHECK-NEXT: [[TMP124:%.*]] = sub <2 x i32> [[TMP118 ]], [[TMP155 ]]
192
192
; CHECK-NEXT: [[TMP125:%.*]] = shl <2 x i32> [[TMP124]], <i32 16, i32 16>
193
- ; CHECK-NEXT: [[TMP113 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX22_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
194
- ; CHECK-NEXT: [[TMP111:%.*]] = zext <2 x i8> [[TMP113 ]] to <2 x i32>
195
- ; CHECK-NEXT: [[TMP115 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX25_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
196
- ; CHECK-NEXT: [[TMP118 :%.*]] = zext <2 x i8> [[TMP115 ]] to <2 x i32>
197
- ; CHECK-NEXT: [[TMP116 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX27_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
198
- ; CHECK-NEXT: [[TMP128 :%.*]] = zext <2 x i8> [[TMP116 ]] to <2 x i32>
199
- ; CHECK-NEXT: [[TMP135:%.*]] = sub <2 x i32> [[TMP118 ]], [[TMP128 ]]
193
+ ; CHECK-NEXT: [[TMP156 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX22_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
194
+ ; CHECK-NEXT: [[TMP111:%.*]] = zext <2 x i8> [[TMP156 ]] to <2 x i32>
195
+ ; CHECK-NEXT: [[TMP112 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX25_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
196
+ ; CHECK-NEXT: [[TMP113 :%.*]] = zext <2 x i8> [[TMP112 ]] to <2 x i32>
197
+ ; CHECK-NEXT: [[TMP114 :%.*]] = call <2 x i8> @llvm.experimental.vp.strided.load.v2i8.p0.i64(ptr align 1 [[ARRAYIDX27_1]], i64 2, <2 x i1> <i1 true, i1 true>, i32 2)
198
+ ; CHECK-NEXT: [[TMP115 :%.*]] = zext <2 x i8> [[TMP114 ]] to <2 x i32>
199
+ ; CHECK-NEXT: [[TMP135:%.*]] = sub <2 x i32> [[TMP113 ]], [[TMP115 ]]
200
200
; CHECK-NEXT: [[TMP136:%.*]] = shl <2 x i32> [[TMP135]], <i32 16, i32 16>
201
201
; CHECK-NEXT: [[TMP137:%.*]] = insertelement <2 x i32> [[TMP110]], i32 [[CONV33_1]], i32 1
202
202
; CHECK-NEXT: [[TMP119:%.*]] = sub <2 x i32> [[TMP137]], [[TMP111]]
@@ -480,11 +480,11 @@ define i32 @test(ptr %pix1, ptr %pix2, i64 %idx.ext, i64 %idx.ext63, ptr %add.pt
480
480
; THR15-NEXT: [[TMP84:%.*]] = sub <2 x i32> [[TMP78]], [[TMP80]]
481
481
; THR15-NEXT: [[TMP85:%.*]] = shl <2 x i32> [[TMP84]], <i32 16, i32 16>
482
482
; THR15-NEXT: [[TMP86:%.*]] = insertelement <2 x i32> [[TMP74]], i32 [[CONV33]], i32 1
483
- ; THR15-NEXT: [[TMP87 :%.*]] = sub <2 x i32> [[TMP86]], [[TMP76]]
484
- ; THR15-NEXT: [[TMP88:%.*]] = add <2 x i32> [[TMP85]], [[TMP87 ]]
483
+ ; THR15-NEXT: [[TMP93 :%.*]] = sub <2 x i32> [[TMP86]], [[TMP76]]
484
+ ; THR15-NEXT: [[TMP88:%.*]] = add <2 x i32> [[TMP85]], [[TMP93 ]]
485
485
; THR15-NEXT: [[TMP92:%.*]] = insertelement <2 x i32> [[TMP74]], i32 [[CONV]], i32 0
486
- ; THR15-NEXT: [[TMP93 :%.*]] = sub <2 x i32> [[TMP92]], [[TMP68]]
487
- ; THR15-NEXT: [[TMP95:%.*]] = add <2 x i32> [[TMP73]], [[TMP93 ]]
486
+ ; THR15-NEXT: [[TMP87 :%.*]] = sub <2 x i32> [[TMP92]], [[TMP68]]
487
+ ; THR15-NEXT: [[TMP95:%.*]] = add <2 x i32> [[TMP73]], [[TMP87 ]]
488
488
; THR15-NEXT: [[TMP97:%.*]] = shufflevector <2 x i32> [[TMP88]], <2 x i32> [[TMP95]], <2 x i32> <i32 0, i32 2>
489
489
; THR15-NEXT: [[TMP77:%.*]] = add <2 x i32> [[TMP88]], [[TMP95]]
490
490
; THR15-NEXT: [[TMP91:%.*]] = sub <2 x i32> [[TMP95]], [[TMP88]]
@@ -521,13 +521,13 @@ define i32 @test(ptr %pix1, ptr %pix2, i64 %idx.ext, i64 %idx.ext63, ptr %add.pt
521
521
; THR15-NEXT: [[TMP113:%.*]] = sub <2 x i32> [[TMP109]], [[TMP111]]
522
522
; THR15-NEXT: [[TMP114:%.*]] = shl <2 x i32> [[TMP113]], <i32 16, i32 16>
523
523
; THR15-NEXT: [[TMP115:%.*]] = insertelement <2 x i32> [[TMP103]], i32 [[CONV33_1]], i32 1
524
- ; THR15-NEXT: [[TMP116 :%.*]] = sub <2 x i32> [[TMP115]], [[TMP107]]
525
- ; THR15-NEXT: [[TMP117 :%.*]] = add <2 x i32> [[TMP114]], [[TMP116 ]]
524
+ ; THR15-NEXT: [[TMP117 :%.*]] = sub <2 x i32> [[TMP115]], [[TMP107]]
525
+ ; THR15-NEXT: [[TMP116 :%.*]] = add <2 x i32> [[TMP114]], [[TMP117 ]]
526
526
; THR15-NEXT: [[TMP126:%.*]] = insertelement <2 x i32> [[TMP103]], i32 [[CONV_1]], i32 0
527
527
; THR15-NEXT: [[TMP127:%.*]] = sub <2 x i32> [[TMP126]], [[TMP99]]
528
528
; THR15-NEXT: [[TMP128:%.*]] = add <2 x i32> [[TMP102]], [[TMP127]]
529
- ; THR15-NEXT: [[TMP106:%.*]] = add <2 x i32> [[TMP117 ]], [[TMP128]]
530
- ; THR15-NEXT: [[TMP121:%.*]] = sub <2 x i32> [[TMP128]], [[TMP117 ]]
529
+ ; THR15-NEXT: [[TMP106:%.*]] = add <2 x i32> [[TMP116 ]], [[TMP128]]
530
+ ; THR15-NEXT: [[TMP121:%.*]] = sub <2 x i32> [[TMP128]], [[TMP116 ]]
531
531
; THR15-NEXT: [[TMP118:%.*]] = extractelement <2 x i32> [[TMP106]], i32 0
532
532
; THR15-NEXT: [[TMP119:%.*]] = extractelement <2 x i32> [[TMP106]], i32 1
533
533
; THR15-NEXT: [[ADD48_1:%.*]] = add i32 [[TMP119]], [[TMP118]]
0 commit comments