1
- ; RUN: opt < %s -loop-vectorize -instcombine -mtriple aarch64-unknown-linux-gnu -enable-strict-reductions -S | FileCheck %s -check-prefix=CHECK
1
+ ; RUN: opt < %s -loop-vectorize -mtriple aarch64-unknown-linux-gnu -enable-strict-reductions -S | FileCheck %s -check-prefix=CHECK
2
2
3
3
define float @fadd_strict(float* noalias nocapture readonly %a, i64 %n) {
4
4
; CHECK-LABEL: @fadd_strict
@@ -30,14 +30,17 @@ define float @fadd_strict_unroll(float* noalias nocapture readonly %a, i64 %n) {
30
30
; CHECK-LABEL: @fadd_strict_unroll
31
31
; CHECK: vector.body:
32
32
; CHECK: %[[VEC_PHI1:.*]] = phi float [ 0.000000e+00, %vector.ph ], [ %[[RDX4:.*]], %vector.body ]
33
+ ; CHECK: %[[VEC_PHI2:.*]] = phi float [ -0.000000e+00, %vector.ph ], [ %[[RDX4]], %vector.body ]
34
+ ; CHECK: %[[VEC_PHI3:.*]] = phi float [ -0.000000e+00, %vector.ph ], [ %[[RDX4]], %vector.body ]
35
+ ; CHECK: %[[VEC_PHI4:.*]] = phi float [ -0.000000e+00, %vector.ph ], [ %[[RDX4]], %vector.body ]
33
36
; CHECK: %[[LOAD1:.*]] = load <8 x float>, <8 x float>*
34
37
; CHECK: %[[LOAD2:.*]] = load <8 x float>, <8 x float>*
35
38
; CHECK: %[[LOAD3:.*]] = load <8 x float>, <8 x float>*
36
39
; CHECK: %[[LOAD4:.*]] = load <8 x float>, <8 x float>*
37
40
; CHECK: %[[RDX1:.*]] = call float @llvm.vector.reduce.fadd.v8f32(float %[[VEC_PHI1]], <8 x float> %[[LOAD1]])
38
41
; CHECK: %[[RDX2:.*]] = call float @llvm.vector.reduce.fadd.v8f32(float %[[RDX1]], <8 x float> %[[LOAD2]])
39
42
; CHECK: %[[RDX3:.*]] = call float @llvm.vector.reduce.fadd.v8f32(float %[[RDX2]], <8 x float> %[[LOAD3]])
40
- ; CHECK: %[[RDX4:.*]] = call float @llvm.vector.reduce.fadd.v8f32(float %[[RDX3]], <8 x float> %[[LOAD4]])
43
+ ; CHECK: %[[RDX4]] = call float @llvm.vector.reduce.fadd.v8f32(float %[[RDX3]], <8 x float> %[[LOAD4]])
41
44
; CHECK: for.end
42
45
; CHECK: %[[PHI:.*]] = phi float [ %[[SCALAR:.*]], %for.body ], [ %[[RDX4]], %middle.block ]
43
46
; CHECK: ret float %[[PHI]]
@@ -148,7 +151,8 @@ define float @fadd_conditional(float* noalias nocapture readonly %a, float* noal
148
151
; CHECK: br i1 %[[EXTRACT]], label %pred.load.if, label %pred.load.continue
149
152
; CHECK: pred.load.continue6
150
153
; CHECK: %[[PHI1:.*]] = phi <4 x float> [ %[[PHI0:.*]], %pred.load.continue4 ], [ %[[INS_ELT:.*]], %pred.load.if5 ]
151
- ; CHECK: %[[PRED:.*]] = select <4 x i1> %[[FCMP1]], <4 x float> %[[PHI1]], <4 x float> <float 3.000000e+00, float 3.000000e+00, float 3.000000e+00, float 3.000000e+00>
154
+ ; CHECK: %[[XOR:.*]] = xor <4 x i1> %[[FCMP1]], <i1 true, i1 true, i1 true, i1 true>
155
+ ; CHECK: %[[PRED:.*]] = select <4 x i1> %[[XOR]], <4 x float> <float 3.000000e+00, float 3.000000e+00, float 3.000000e+00, float 3.000000e+00>, <4 x float> %[[PHI1]]
152
156
; CHECK: %[[RDX]] = call float @llvm.vector.reduce.fadd.v4f32(float %[[PHI]], <4 x float> %[[PRED]])
153
157
; CHECK: for.body
154
158
; CHECK: %[[RES_PHI:.*]] = phi float [ %[[MERGE_RDX:.*]], %scalar.ph ], [ %[[FADD:.*]], %for.inc ]
@@ -196,7 +200,7 @@ for.end:
196
200
define float @fadd_predicated(float* noalias nocapture %a, i64 %n) {
197
201
; CHECK-LABEL: @fadd_predicated
198
202
; CHECK: vector.ph
199
- ; CHECK: %[[TRIP_MINUS_ONE:.*]] = add i64 %n, -1
203
+ ; CHECK: %[[TRIP_MINUS_ONE:.*]] = sub i64 %n, 1
200
204
; CHECK: %[[BROADCAST_INS:.*]] = insertelement <2 x i64> poison, i64 %[[TRIP_MINUS_ONE]], i32 0
201
205
; CHECK: %[[SPLAT:.*]] = shufflevector <2 x i64> %[[BROADCAST_INS]], <2 x i64> poison, <2 x i32> zeroinitializer
202
206
; CHECK: vector.body
@@ -206,7 +210,7 @@ define float @fadd_predicated(float* noalias nocapture %a, i64 %n) {
206
210
; CHECK: %[[MASK:.*]] = select <2 x i1> %0, <2 x float> %[[PHI]], <2 x float> <float -0.000000e+00, float -0.000000e+00>
207
211
; CHECK: %[[RDX]] = call float @llvm.vector.reduce.fadd.v2f32(float %[[RDX_PHI]], <2 x float> %[[MASK]])
208
212
; CHECK: for.end:
209
- ; CHECK: %[[RES_PHI:.*]] = phi float [ undef, %for.body ], [ %[[RDX]], %middle.block ]
213
+ ; CHECK: %[[RES_PHI:.*]] = phi float [ %[[FADD:.*]], %for.body ], [ %[[RDX]], %middle.block ]
210
214
; CHECK: ret float %[[RES_PHI]]
211
215
entry:
212
216
br label %for.body
0 commit comments