Skip to content

Commit

Permalink
[x86] Improve select lowering for smin(x, 0) & smax(x, 0)
Browse files Browse the repository at this point in the history
smin(x, 0):
  (select (x < 0), x, 0) -> ((x >> (size_in_bits(x)-1))) & x

smax(x, 0):
  (select (x > 0), x, 0) -> (~(x >> (size_in_bits(x)-1))) & x
  The comparison is testing for a positive value, we have to invert the sign
  bit mask, so only do that transform if the target has a bitwise 'and not'
  instruction (the invert is free).

The transform is performed only when CMP has a single user to avoid
increasing total instruction number.

https://alive2.llvm.org/ce/z/euUnNm
https://alive2.llvm.org/ce/z/37339J

Differential Revision: https://reviews.llvm.org/D123109
  • Loading branch information
williamweixiao committed Apr 7, 2022
1 parent 674ee4d commit 842d0bf
Show file tree
Hide file tree
Showing 2 changed files with 52 additions and 19 deletions.
18 changes: 18 additions & 0 deletions llvm/lib/Target/X86/X86ISelLowering.cpp
Expand Up @@ -24699,6 +24699,8 @@ SDValue X86TargetLowering::LowerSELECT(SDValue Op, SelectionDAG &DAG) const {
// (select (x != 0), -1, y) -> ~(sign_bit (x - 1)) | y
// (select (and (x , 0x1) == 0), y, (z ^ y) ) -> (-(and (x , 0x1)) & z ) ^ y
// (select (and (x , 0x1) == 0), y, (z | y) ) -> (-(and (x , 0x1)) & z ) | y
// (select (x > 0), x, 0) -> (~(x >> (size_in_bits(x)-1))) & x
// (select (x < 0), x, 0) -> ((x >> (size_in_bits(x)-1))) & x
if (Cond.getOpcode() == X86ISD::SETCC &&
Cond.getOperand(1).getOpcode() == X86ISD::CMP &&
isNullConstant(Cond.getOperand(1).getOperand(1))) {
Expand Down Expand Up @@ -24779,6 +24781,22 @@ SDValue X86TargetLowering::LowerSELECT(SDValue Op, SelectionDAG &DAG) const {
SDValue And = DAG.getNode(ISD::AND, DL, VT, Mask, Src1); // Mask & z
return DAG.getNode(Op2.getOpcode(), DL, VT, And, Src2); // And Op y
}
} else if ((VT == MVT::i32 || VT == MVT::i64) && isNullConstant(Op2) &&
Cmp.getNode()->hasOneUse() && (CmpOp0 == Op1) &&
((CondCode == X86::COND_S) || // smin(x, 0)
(CondCode == X86::COND_G && hasAndNot(Op1)))) { // smax(x, 0)
// (select (x < 0), x, 0) -> ((x >> (size_in_bits(x)-1))) & x
//
// If the comparison is testing for a positive value, we have to invert
// the sign bit mask, so only do that transform if the target has a
// bitwise 'and not' instruction (the invert is free).
// (select (x > 0), x, 0) -> (~(x >> (size_in_bits(x)-1))) & x
unsigned ShCt = VT.getSizeInBits() - 1;
SDValue ShiftAmt = DAG.getConstant(ShCt, DL, VT);
SDValue Shift = DAG.getNode(ISD::SRA, DL, VT, Op1, ShiftAmt);
if (CondCode == X86::COND_G)
Shift = DAG.getNOT(DL, Shift, VT);
return DAG.getNode(ISD::AND, DL, VT, Shift, Op1);
}
}

Expand Down
53 changes: 34 additions & 19 deletions llvm/test/CodeGen/X86/select-smin-smax.ll
@@ -1,50 +1,65 @@
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi < %s | FileCheck %s
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=-bmi < %s | FileCheck %s --check-prefixes=CHECK,CHECK-NOBMI
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi < %s | FileCheck %s --check-prefixes=CHECK,CHECK-BMI

declare i32 @llvm.smax.i32(i32, i32)
declare i32 @llvm.smin.i32(i32, i32)
declare i64 @llvm.smax.i64(i64, i64)
declare i64 @llvm.smin.i64(i64, i64)

define i32 @test_i32_smax(i32 %a) nounwind {
; CHECK-LABEL: test_i32_smax:
; CHECK: # %bb.0:
; CHECK-NEXT: xorl %eax, %eax
; CHECK-NEXT: testl %edi, %edi
; CHECK-NEXT: cmovgl %edi, %eax
; CHECK-NEXT: retq
; CHECK-NOBMI-LABEL: test_i32_smax:
; CHECK-NOBMI: # %bb.0:
; CHECK-NOBMI-NEXT: xorl %eax, %eax
; CHECK-NOBMI-NEXT: testl %edi, %edi
; CHECK-NOBMI-NEXT: cmovgl %edi, %eax
; CHECK-NOBMI-NEXT: retq
;
; CHECK-BMI-LABEL: test_i32_smax:
; CHECK-BMI: # %bb.0:
; CHECK-BMI-NEXT: movl %edi, %eax
; CHECK-BMI-NEXT: sarl $31, %eax
; CHECK-BMI-NEXT: andnl %edi, %eax, %eax
; CHECK-BMI-NEXT: retq
%r = call i32 @llvm.smax.i32(i32 %a, i32 0)
ret i32 %r
}

define i32 @test_i32_smin(i32 %a) nounwind {
; CHECK-LABEL: test_i32_smin:
; CHECK: # %bb.0:
; CHECK-NEXT: xorl %eax, %eax
; CHECK-NEXT: testl %edi, %edi
; CHECK-NEXT: cmovsl %edi, %eax
; CHECK-NEXT: movl %edi, %eax
; CHECK-NEXT: sarl $31, %eax
; CHECK-NEXT: andl %edi, %eax
; CHECK-NEXT: retq
%r = call i32 @llvm.smin.i32(i32 %a, i32 0)
ret i32 %r
}

define i64 @test_i64_smax(i64 %a) nounwind {
; CHECK-LABEL: test_i64_smax:
; CHECK: # %bb.0:
; CHECK-NEXT: xorl %eax, %eax
; CHECK-NEXT: testq %rdi, %rdi
; CHECK-NEXT: cmovgq %rdi, %rax
; CHECK-NEXT: retq
; CHECK-NOBMI-LABEL: test_i64_smax:
; CHECK-NOBMI: # %bb.0:
; CHECK-NOBMI-NEXT: xorl %eax, %eax
; CHECK-NOBMI-NEXT: testq %rdi, %rdi
; CHECK-NOBMI-NEXT: cmovgq %rdi, %rax
; CHECK-NOBMI-NEXT: retq
;
; CHECK-BMI-LABEL: test_i64_smax:
; CHECK-BMI: # %bb.0:
; CHECK-BMI-NEXT: movq %rdi, %rax
; CHECK-BMI-NEXT: sarq $63, %rax
; CHECK-BMI-NEXT: andnq %rdi, %rax, %rax
; CHECK-BMI-NEXT: retq
%r = call i64 @llvm.smax.i64(i64 %a, i64 0)
ret i64 %r
}

define i64 @test_i64_smin(i64 %a) nounwind {
; CHECK-LABEL: test_i64_smin:
; CHECK: # %bb.0:
; CHECK-NEXT: xorl %eax, %eax
; CHECK-NEXT: testq %rdi, %rdi
; CHECK-NEXT: cmovsq %rdi, %rax
; CHECK-NEXT: movq %rdi, %rax
; CHECK-NEXT: sarq $63, %rax
; CHECK-NEXT: andq %rdi, %rax
; CHECK-NEXT: retq
%r = call i64 @llvm.smin.i64(i64 %a, i64 0)
ret i64 %r
Expand Down

0 comments on commit 842d0bf

Please sign in to comment.