265 changes: 105 additions & 160 deletions llvm/test/CodeGen/X86/xaluo.ll
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=x86_64-darwin-unknown < %s | FileCheck %s --check-prefixes=CHECK,SDAG,GENERIC
; RUN: llc -mtriple=x86_64-darwin-unknown -fast-isel -fast-isel-abort=1 < %s | FileCheck %s --check-prefixes=CHECK,FAST
; RUN: llc -mtriple=x86_64-darwin-unknown -mcpu=knl < %s | FileCheck %s --check-prefixes=CHECK,SDAG,KNL
;
; Every run lists the shared prefix first, so assertions that are identical for
; all three configurations only need to be written once. The remaining prefixes
; select assertions specific to the default instruction selector, to
; -fast-isel, or to the default / -mcpu=knl subtarget.

;
; Get the actual value of the overflow bit.
Expand Down Expand Up @@ -550,167 +550,107 @@ define zeroext i1 @usuboi64(i64 %v1, i64 %v2, ptr %res) {
; Check the use of the overflow bit in combination with a select instruction.
;
; i32 signed add: only the overflow bit is used, as the condition of a select
; between the two original operands. The flag from the add is expected to feed
; a cmovo directly, without being materialised by a setcc first.
define i32 @saddoselecti32(i32 %v1, i32 %v2) {
; CHECK-LABEL: saddoselecti32:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movl %esi, %eax
; CHECK-NEXT:    movl %edi, %ecx
; CHECK-NEXT:    addl %esi, %ecx
; CHECK-NEXT:    cmovol %edi, %eax
; CHECK-NEXT:    retq
  %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 %v2)
  %obit = extractvalue {i32, i1} %t, 1
  %ret = select i1 %obit, i32 %v1, i32 %v2
  ret i32 %ret
}

; i64 signed add: only the overflow bit is used, as the condition of a select
; between the two original operands. The flag from the add is expected to feed
; a cmovo directly, without being materialised by a setcc first.
define i64 @saddoselecti64(i64 %v1, i64 %v2) {
; CHECK-LABEL: saddoselecti64:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movq %rsi, %rax
; CHECK-NEXT:    movq %rdi, %rcx
; CHECK-NEXT:    addq %rsi, %rcx
; CHECK-NEXT:    cmovoq %rdi, %rax
; CHECK-NEXT:    retq
  %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 %v2)
  %obit = extractvalue {i64, i1} %t, 1
  %ret = select i1 %obit, i64 %v1, i64 %v2
  ret i64 %ret
}

; i32 unsigned add: only the overflow (carry) bit is used, as the condition of a
; select between the two original operands. The carry from the add is expected
; to feed a cmovb directly, without being materialised by a setcc first.
define i32 @uaddoselecti32(i32 %v1, i32 %v2) {
; CHECK-LABEL: uaddoselecti32:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movl %esi, %eax
; CHECK-NEXT:    movl %edi, %ecx
; CHECK-NEXT:    addl %esi, %ecx
; CHECK-NEXT:    cmovbl %edi, %eax
; CHECK-NEXT:    retq
  %t = call {i32, i1} @llvm.uadd.with.overflow.i32(i32 %v1, i32 %v2)
  %obit = extractvalue {i32, i1} %t, 1
  %ret = select i1 %obit, i32 %v1, i32 %v2
  ret i32 %ret
}

; i64 unsigned add: only the overflow (carry) bit is used, as the condition of a
; select between the two original operands. The carry from the add is expected
; to feed a cmovb directly, without being materialised by a setcc first.
define i64 @uaddoselecti64(i64 %v1, i64 %v2) {
; CHECK-LABEL: uaddoselecti64:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movq %rsi, %rax
; CHECK-NEXT:    movq %rdi, %rcx
; CHECK-NEXT:    addq %rsi, %rcx
; CHECK-NEXT:    cmovbq %rdi, %rax
; CHECK-NEXT:    retq
  %t = call {i64, i1} @llvm.uadd.with.overflow.i64(i64 %v1, i64 %v2)
  %obit = extractvalue {i64, i1} %t, 1
  %ret = select i1 %obit, i64 %v1, i64 %v2
  ret i64 %ret
}

; i32 signed subtract: only the overflow bit is used, as the condition of a
; select between the two original operands. The difference itself is dead, so
; the expected code sets the flags with a cmp and consumes them with a cmovo.
define i32 @ssuboselecti32(i32 %v1, i32 %v2) {
; CHECK-LABEL: ssuboselecti32:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movl %esi, %eax
; CHECK-NEXT:    cmpl %esi, %edi
; CHECK-NEXT:    cmovol %edi, %eax
; CHECK-NEXT:    retq
  %t = call {i32, i1} @llvm.ssub.with.overflow.i32(i32 %v1, i32 %v2)
  %obit = extractvalue {i32, i1} %t, 1
  %ret = select i1 %obit, i32 %v1, i32 %v2
  ret i32 %ret
}

; i64 signed subtract: only the overflow bit is used, as the condition of a
; select between the two original operands. The difference itself is dead, so
; the expected code sets the flags with a cmp and consumes them with a cmovo.
define i64 @ssuboselecti64(i64 %v1, i64 %v2) {
; CHECK-LABEL: ssuboselecti64:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movq %rsi, %rax
; CHECK-NEXT:    cmpq %rsi, %rdi
; CHECK-NEXT:    cmovoq %rdi, %rax
; CHECK-NEXT:    retq
  %t = call {i64, i1} @llvm.ssub.with.overflow.i64(i64 %v1, i64 %v2)
  %obit = extractvalue {i64, i1} %t, 1
  %ret = select i1 %obit, i64 %v1, i64 %v2
  ret i64 %ret
}

; i32 unsigned subtract: only the overflow (borrow) bit is used, as the
; condition of a select between the two original operands. The difference
; itself is dead, so the expected code sets the flags with a cmp and consumes
; them with a cmovb.
define i32 @usuboselecti32(i32 %v1, i32 %v2) {
; CHECK-LABEL: usuboselecti32:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movl %esi, %eax
; CHECK-NEXT:    cmpl %esi, %edi
; CHECK-NEXT:    cmovbl %edi, %eax
; CHECK-NEXT:    retq
  %t = call {i32, i1} @llvm.usub.with.overflow.i32(i32 %v1, i32 %v2)
  %obit = extractvalue {i32, i1} %t, 1
  %ret = select i1 %obit, i32 %v1, i32 %v2
  ret i32 %ret
}

define i64 @usuboselecti64(i64 %v1, i64 %v2) {
; SDAG-LABEL: usuboselecti64:
; SDAG: ## %bb.0:
; SDAG-NEXT: movq %rsi, %rax
; SDAG-NEXT: cmpq %rsi, %rdi
; SDAG-NEXT: cmovbq %rdi, %rax
; SDAG-NEXT: retq
;
; FAST-LABEL: usuboselecti64:
; FAST: ## %bb.0:
; FAST-NEXT: movq %rsi, %rax
; FAST-NEXT: cmpq %rsi, %rdi
; FAST-NEXT: cmovbq %rdi, %rax
; FAST-NEXT: retq
; CHECK-LABEL: usuboselecti64:
; CHECK: ## %bb.0:
; CHECK-NEXT: movq %rsi, %rax
; CHECK-NEXT: cmpq %rsi, %rdi
; CHECK-NEXT: cmovbq %rdi, %rax
; CHECK-NEXT: retq
%t = call {i64, i1} @llvm.usub.with.overflow.i64(i64 %v1, i64 %v2)
%obit = extractvalue {i64, i1} %t, 1
%ret = select i1 %obit, i64 %v1, i64 %v2
Expand Down Expand Up @@ -1024,42 +964,56 @@ continue:
ret i1 true
}

; Signed add whose operands are first narrowed by an arithmetic shift right by
; 17 and a logical shift right by 31. The expected code performs the addition
; with a flag-free lea and returns a constant-zero overflow bit.
define {i64, i1} @saddoovf(i64 %a, i64 %b) {
; CHECK-LABEL: saddoovf:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    sarq $17, %rdi
; CHECK-NEXT:    shrq $31, %rsi
; CHECK-NEXT:    leaq (%rsi,%rdi), %rax
; CHECK-NEXT:    xorl %edx, %edx
; CHECK-NEXT:    retq
  %lhs = ashr i64 %a, 17
  %rhs = lshr i64 %b, 31
  %sum = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %lhs, i64 %rhs)
  ret {i64, i1} %sum
}

; FIXME: The overflow bit is still computed with a seto even though this signed
; subtraction cannot overflow: both operands have a clear sign bit (the first
; is masked to its low 16 bits, the second is logically shifted right by 22).
define {i64, i1} @ssuboovf(i64 %a, i64 %b) {
; CHECK-LABEL: ssuboovf:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movzwl %di, %eax
; CHECK-NEXT:    shrq $22, %rsi
; CHECK-NEXT:    subq %rsi, %rax
; CHECK-NEXT:    seto %dl
; CHECK-NEXT:    retq
  %lhs = and i64 %a, 65535
  %rhs = lshr i64 %b, 22
  %diff = call {i64, i1} @llvm.ssub.with.overflow.i64(i64 %lhs, i64 %rhs)
  ret {i64, i1} %diff
}

; Unsigned add of two values that are each masked to their low 8 bits, so the
; i64 sum cannot carry out. The expected code performs a plain add and returns
; a constant-zero overflow bit.
define {i64, i1} @uaddoovf(i64 %a, i64 %b) {
; CHECK-LABEL: uaddoovf:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    movzbl %dil, %ecx
; CHECK-NEXT:    movzbl %sil, %eax
; CHECK-NEXT:    addq %rcx, %rax
; CHECK-NEXT:    xorl %edx, %edx
; CHECK-NEXT:    retq
  %1 = and i64 %a, 255
  %2 = and i64 %b, 255
  %t = call {i64, i1} @llvm.uadd.with.overflow.i64(i64 %1, i64 %2)
  ret {i64, i1} %t
}

define {i64, i1} @usuboovf(i64 %a, i64 %b) {
; SDAG-LABEL: usuboovf:
; SDAG: ## %bb.0:
; SDAG-NEXT: movq %rsi, %rax
; SDAG-NEXT: notq %rax
; SDAG-NEXT: xorl %edx, %edx
; SDAG-NEXT: retq
;
; FAST-LABEL: usuboovf:
; FAST: ## %bb.0:
; FAST-NEXT: movq %rsi, %rax
; FAST-NEXT: notq %rax
; FAST-NEXT: xorl %edx, %edx
; FAST-NEXT: retq
; CHECK-LABEL: usuboovf:
; CHECK: ## %bb.0:
; CHECK-NEXT: movq %rsi, %rax
; CHECK-NEXT: notq %rax
; CHECK-NEXT: xorl %edx, %edx
; CHECK-NEXT: retq
%t0 = call {i64, i1} @llvm.usub.with.overflow.i64(i64 %a, i64 %a)
%v0 = extractvalue {i64, i1} %t0, 0
%o0 = extractvalue {i64, i1} %t0, 1
Expand All @@ -1077,23 +1031,14 @@ define {i64, i1} @usuboovf(i64 %a, i64 %b) {

; Make sure we select an INC for both the data use and the flag use.
define i32 @incovfselectstore(i32 %v1, i32 %v2, ptr %x) {
; SDAG-LABEL: incovfselectstore:
; SDAG: ## %bb.0:
; SDAG-NEXT: movl %esi, %eax
; SDAG-NEXT: movl %edi, %ecx
; SDAG-NEXT: incl %ecx
; SDAG-NEXT: cmovol %edi, %eax
; SDAG-NEXT: movl %ecx, (%rdx)
; SDAG-NEXT: retq
;
; FAST-LABEL: incovfselectstore:
; FAST: ## %bb.0:
; FAST-NEXT: movl %esi, %eax
; FAST-NEXT: movl %edi, %ecx
; FAST-NEXT: incl %ecx
; FAST-NEXT: cmovol %edi, %eax
; FAST-NEXT: movl %ecx, (%rdx)
; FAST-NEXT: retq
; CHECK-LABEL: incovfselectstore:
; CHECK: ## %bb.0:
; CHECK-NEXT: movl %esi, %eax
; CHECK-NEXT: movl %edi, %ecx
; CHECK-NEXT: incl %ecx
; CHECK-NEXT: cmovol %edi, %eax
; CHECK-NEXT: movl %ecx, (%rdx)
; CHECK-NEXT: retq
%t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 1)
%obit = extractvalue {i32, i1} %t, 1
%ret = select i1 %obit, i32 %v1, i32 %v2
Expand Down