Skip to content

Commit

Permalink
Precommit test for redundant mvn instructions
Browse files Browse the repository at this point in the history
  • Loading branch information
MacDue authored and c-rhodes committed Nov 4, 2022
1 parent 6875ac6 commit 901e5a7
Showing 1 changed file with 87 additions and 0 deletions.
@@ -0,0 +1,87 @@
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=aarch64 < %s | FileCheck %s

; All tests perform unordered floating-point comparisons (fcmp ule) on vectors
; wider than a single 128-bit Neon register.

; Returns true when no lane of the <8 x float> argument compares "unordered or
; less than or equal" (ule) against zero: the <8 x i1> compare mask is bitcast
; to an i8 and tested for equality with 0.
;
; The expected assembly lowers the compare on each 4 x float register as fcmgt
; against #0.0 followed by mvn (ule is the negation of ogt), narrows the lane
; masks with uzp1/xtn, and reduces them with umaxv.
; NOTE(review): the mvn instructions are presumably the redundant ones this
; test is meant to track -- confirm against the commit that introduced it.
define i1 @unordered_floating_point_compare_on_v8f32(<8 x float> %a_vec) {
; CHECK-LABEL: unordered_floating_point_compare_on_v8f32:
; CHECK: // %bb.0:
; CHECK-NEXT: fcmgt v1.4s, v1.4s, #0.0
; CHECK-NEXT: mov w8, #1
; CHECK-NEXT: fcmgt v0.4s, v0.4s, #0.0
; CHECK-NEXT: mvn v1.16b, v1.16b
; CHECK-NEXT: mvn v0.16b, v0.16b
; CHECK-NEXT: uzp1 v0.8h, v0.8h, v1.8h
; CHECK-NEXT: xtn v0.8b, v0.8h
; CHECK-NEXT: umaxv b0, v0.8b
; CHECK-NEXT: fmov w9, s0
; CHECK-NEXT: bic w0, w8, w9
; CHECK-NEXT: ret
; Lane-wise compare of the input against the all-zero vector.
%a_cmp = fcmp ule <8 x float> %a_vec, zeroinitializer
; Pack the eight i1 lane results into a single i8 bitmask.
%cmp_result = bitcast <8 x i1> %a_cmp to i8
; True only if every lane result was false.
%all_zero = icmp eq i8 %cmp_result, 0
ret i1 %all_zero
}

; Returns true when no lane of the <16 x float> argument compares "unordered
; or less than or equal" (ule) against zero: the <16 x i1> compare mask is
; bitcast to an i16 and tested for equality with 0.
;
; The expected assembly performs fcmgt against #0.0 plus mvn on each of the
; four 4 x float registers, narrows the lane masks into one 16-byte vector with
; three uzp1 instructions, and reduces that vector with umaxv.
; NOTE(review): the mvn instructions are presumably the redundant ones this
; test is meant to track -- confirm against the commit that introduced it.
define i1 @unordered_floating_point_compare_on_v16f32(<16 x float> %a_vec) {
; CHECK-LABEL: unordered_floating_point_compare_on_v16f32:
; CHECK: // %bb.0:
; CHECK-NEXT: fcmgt v3.4s, v3.4s, #0.0
; CHECK-NEXT: mov w8, #1
; CHECK-NEXT: fcmgt v2.4s, v2.4s, #0.0
; CHECK-NEXT: fcmgt v1.4s, v1.4s, #0.0
; CHECK-NEXT: fcmgt v0.4s, v0.4s, #0.0
; CHECK-NEXT: mvn v3.16b, v3.16b
; CHECK-NEXT: mvn v2.16b, v2.16b
; CHECK-NEXT: mvn v1.16b, v1.16b
; CHECK-NEXT: mvn v0.16b, v0.16b
; CHECK-NEXT: uzp1 v2.8h, v2.8h, v3.8h
; CHECK-NEXT: uzp1 v0.8h, v0.8h, v1.8h
; CHECK-NEXT: uzp1 v0.16b, v0.16b, v2.16b
; CHECK-NEXT: umaxv b0, v0.16b
; CHECK-NEXT: fmov w9, s0
; CHECK-NEXT: bic w0, w8, w9
; CHECK-NEXT: ret
; Lane-wise compare of the input against the all-zero vector.
%a_cmp = fcmp ule <16 x float> %a_vec, zeroinitializer
; Pack the sixteen i1 lane results into a single i16 bitmask.
%cmp_result = bitcast <16 x i1> %a_cmp to i16
; True only if every lane result was false.
%all_zero = icmp eq i16 %cmp_result, 0
ret i1 %all_zero
}

; Returns true when no lane of the <32 x float> argument compares "unordered
; or less than or equal" (ule) against zero: the <32 x i1> compare mask is
; bitcast to an i32 and tested for equality with 0.
;
; The expected assembly performs fcmgt against #0.0 plus mvn on each of the
; eight 4 x float registers, narrows the lane masks into two 16-byte vectors
; with uzp1, combines those two vectors with orr, and reduces the result with
; umaxv.
; NOTE(review): the mvn instructions are presumably the redundant ones this
; test is meant to track -- confirm against the commit that introduced it.
define i1 @unordered_floating_point_compare_on_v32f32(<32 x float> %a_vec) {
; CHECK-LABEL: unordered_floating_point_compare_on_v32f32:
; CHECK: // %bb.0:
; CHECK-NEXT: fcmgt v7.4s, v7.4s, #0.0
; CHECK-NEXT: mov w9, #1
; CHECK-NEXT: fcmgt v6.4s, v6.4s, #0.0
; CHECK-NEXT: fcmgt v5.4s, v5.4s, #0.0
; CHECK-NEXT: fcmgt v4.4s, v4.4s, #0.0
; CHECK-NEXT: fcmgt v3.4s, v3.4s, #0.0
; CHECK-NEXT: fcmgt v2.4s, v2.4s, #0.0
; CHECK-NEXT: fcmgt v1.4s, v1.4s, #0.0
; CHECK-NEXT: fcmgt v0.4s, v0.4s, #0.0
; CHECK-NEXT: mvn v7.16b, v7.16b
; CHECK-NEXT: mvn v6.16b, v6.16b
; CHECK-NEXT: mvn v5.16b, v5.16b
; CHECK-NEXT: mvn v4.16b, v4.16b
; CHECK-NEXT: mvn v3.16b, v3.16b
; CHECK-NEXT: mvn v2.16b, v2.16b
; CHECK-NEXT: mvn v1.16b, v1.16b
; CHECK-NEXT: mvn v0.16b, v0.16b
; CHECK-NEXT: uzp1 v6.8h, v6.8h, v7.8h
; CHECK-NEXT: uzp1 v4.8h, v4.8h, v5.8h
; CHECK-NEXT: uzp1 v2.8h, v2.8h, v3.8h
; CHECK-NEXT: uzp1 v0.8h, v0.8h, v1.8h
; CHECK-NEXT: uzp1 v1.16b, v4.16b, v6.16b
; CHECK-NEXT: uzp1 v0.16b, v0.16b, v2.16b
; CHECK-NEXT: orr v0.16b, v0.16b, v1.16b
; CHECK-NEXT: umaxv b0, v0.16b
; CHECK-NEXT: fmov w8, s0
; CHECK-NEXT: bic w0, w9, w8
; CHECK-NEXT: ret
; Lane-wise compare of the input against the all-zero vector.
%a_cmp = fcmp ule <32 x float> %a_vec, zeroinitializer
; Pack the thirty-two i1 lane results into a single i32 bitmask.
%cmp_result = bitcast <32 x i1> %a_cmp to i32
; True only if every lane result was false.
%all_zero = icmp eq i32 %cmp_result, 0
ret i1 %all_zero
}

0 comments on commit 901e5a7

Please sign in to comment.