Skip to content

Commit

Permalink
Revert "[AArch64] Adjust operand sequence for Add+Sub to combine more…
Browse files Browse the repository at this point in the history
… inline shift"

This reverts commit ada9ab6.
  • Loading branch information
bcl5980 committed Oct 28, 2022
1 parent 9481e4b commit dfb16bd
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 55 deletions.
31 changes: 0 additions & 31 deletions llvm/lib/Target/AArch64/AArch64ISelLowering.cpp
Expand Up @@ -16854,32 +16854,6 @@ static SDValue performBuildVectorCombine(SDNode *N,
return SDValue();
}

// ((X >> C) - Y) + Z --> (Z - Y) + (X >> C)
static SDValue performAddCombineSubShift(SDNode *N, SDValue SUB, SDValue Z,
SelectionDAG &DAG) {
// DAGCombiner will revert the combination when Z is constant cause
// dead loop. So don't enable the combination when Z is constant.
if (isa<ConstantSDNode>(Z))
return SDValue();

if (SUB.getOpcode() != ISD::SUB || !SUB.hasOneUse())
return SDValue();

SDValue SHL = SUB.getOperand(0);
if (SHL.getOpcode() != ISD::SHL || !SHL.hasOneUse())
return SDValue();

if (!isa<ConstantSDNode>(SHL.getOperand(1)))
return SDValue();

SDLoc DL(N);
EVT VT = N->getValueType(0);

SDValue Y = SUB.getOperand(1);
SDValue NewSub = DAG.getNode(ISD::SUB, DL, VT, Z, Y);
return DAG.getNode(ISD::ADD, DL, VT, NewSub, SHL);
}

static SDValue performAddCombineForShiftedOperands(SDNode *N,
SelectionDAG &DAG) {
// NOTE: Swapping LHS and RHS is not done for SUB, since SUB is not
Expand All @@ -16897,11 +16871,6 @@ static SDValue performAddCombineForShiftedOperands(SDNode *N,
SDValue LHS = N->getOperand(0);
SDValue RHS = N->getOperand(1);

if (SDValue Val = performAddCombineSubShift(N, LHS, RHS, DAG))
return Val;
if (SDValue Val = performAddCombineSubShift(N, RHS, LHS, DAG))
return Val;

uint64_t LHSImm = 0, RHSImm = 0;
// If both operand are shifted by imm and shift amount is not greater than 4
// for one operand, swap LHS and RHS to put operand with smaller shift amount
Expand Down
33 changes: 9 additions & 24 deletions llvm/test/CodeGen/AArch64/addsub.ll
Expand Up @@ -694,55 +694,40 @@ if.end: ; preds = %if.then, %lor.lhs.f
ret i32 undef
}

; ((X >> C) - Y) + Z --> (Z - Y) + (X >> C)
define i32 @commute_subop0(i32 %x, i32 %y, i32 %z) {
; CHECK-LABEL: commute_subop0:
; CHECK: // %bb.0:
; CHECK-NEXT: sub w8, w2, w1
; CHECK-NEXT: add w0, w8, w0, lsl #3
; CHECK-NEXT: lsl w8, w0, #3
; CHECK-NEXT: sub w8, w8, w1
; CHECK-NEXT: add w0, w8, w2
; CHECK-NEXT: ret
%shl = shl i32 %x, 3
%sub = sub i32 %shl, %y
%add = add i32 %sub, %z
ret i32 %add
}

; Z + ((X >> C) - Y) --> (Z - Y) + (X >> C)
define i32 @commute_subop0_cadd(i32 %x, i32 %y, i32 %z) {
; CHECK-LABEL: commute_subop0_cadd:
; CHECK: // %bb.0:
; CHECK-NEXT: sub w8, w2, w1
; CHECK-NEXT: add w0, w8, w0, lsl #3
; CHECK-NEXT: lsl w8, w0, #3
; CHECK-NEXT: sub w8, w8, w1
; CHECK-NEXT: add w0, w2, w8
; CHECK-NEXT: ret
%shl = shl i32 %x, 3
%sub = sub i32 %shl, %y
%add = add i32 %z, %sub
ret i32 %add
}

; Y + ((X >> C) - X) --> (Y - X) + (X >> C)
define i32 @commute_subop0_mul(i32 %x, i32 %y) {
; CHECK-LABEL: commute_subop0_mul:
; CHECK: // %bb.0:
; CHECK-NEXT: sub w8, w1, w0
; CHECK-NEXT: add w0, w8, w0, lsl #3
; CHECK-NEXT: lsl w8, w0, #3
; CHECK-NEXT: sub w8, w8, w0
; CHECK-NEXT: add w0, w8, w1
; CHECK-NEXT: ret
%mul = mul i32 %x, 7
%add = add i32 %mul, %y
ret i32 %add
}

; negative case for ((X >> C) - Y) + Z --> (Z - Y) + (X >> C)
; Z can't be constant to avoid dead loop
define i32 @commute_subop0_zconst(i32 %x, i32 %y) {
; CHECK-LABEL: commute_subop0_zconst:
; CHECK: // %bb.0:
; CHECK-NEXT: lsl w8, w0, #3
; CHECK-NEXT: sub w8, w8, w1
; CHECK-NEXT: add w0, w8, #1
; CHECK-NEXT: ret
%shl = shl i32 %x, 3
%sub = sub i32 %shl, %y
%add = add i32 %sub, 1
ret i32 %add
}

0 comments on commit dfb16bd

Please sign in to comment.