-
Notifications
You must be signed in to change notification settings - Fork 15.1k
ARM: Add more ABIs to llvm.sincos test #166264
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Merged
Merged
Conversation
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Make sure the iOS configurations both with and without sincos_stret are tested.
This stack of pull requests is managed by Graphite. Learn more about stacking. |
|
@llvm/pr-subscribers-backend-arm. Author: Matt Arsenault (arsenm). Changes: Make sure the iOS configurations both with and without sincos_stret are tested. Patch is 32.88 KiB, truncated to 20.00 KiB below; full version: https://github.com/llvm/llvm-project/pull/166264.diff. 1 file affected:
diff --git a/llvm/test/CodeGen/ARM/llvm.sincos.ll b/llvm/test/CodeGen/ARM/llvm.sincos.ll
index 9628405df6bcb..0c2263ee9acbf 100644
--- a/llvm/test/CodeGen/ARM/llvm.sincos.ll
+++ b/llvm/test/CodeGen/ARM/llvm.sincos.ll
@@ -1,223 +1,783 @@
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
-; RUN: llc -mtriple=thumbv7-gnu-linux < %s | FileCheck -check-prefixes=CHECK %s
+; RUN: llc -mtriple=thumbv7-gnu-linux < %s | FileCheck -check-prefix=GNU %s
+; RUN: llc -mtriple=armv7-linux-gnueabi -mcpu=cortex-a8 < %s | FileCheck -check-prefix=GNUEABI %s
+; RUN: llc -mtriple=armv7-apple-ios6 -mcpu=cortex-a8 < %s | FileCheck -check-prefixes=IOS,IOS-NO-STRET %s
+; RUN: llc -mtriple=armv7-apple-ios7 -mcpu=cortex-a8 < %s | FileCheck -check-prefixes=IOS,IOS-WITH-STRET %s
define { half, half } @test_sincos_f16(half %a) {
-; CHECK-LABEL: test_sincos_f16:
-; CHECK: @ %bb.0:
-; CHECK-NEXT: push {r4, lr}
-; CHECK-NEXT: sub sp, #8
-; CHECK-NEXT: bl __gnu_h2f_ieee
-; CHECK-NEXT: add r1, sp, #4
-; CHECK-NEXT: mov r2, sp
-; CHECK-NEXT: bl sincosf
-; CHECK-NEXT: ldr r0, [sp, #4]
-; CHECK-NEXT: bl __gnu_f2h_ieee
-; CHECK-NEXT: mov r4, r0
-; CHECK-NEXT: ldr r0, [sp]
-; CHECK-NEXT: bl __gnu_f2h_ieee
-; CHECK-NEXT: mov r1, r0
-; CHECK-NEXT: mov r0, r4
-; CHECK-NEXT: add sp, #8
-; CHECK-NEXT: pop {r4, pc}
+; GNU-LABEL: test_sincos_f16:
+; GNU: @ %bb.0:
+; GNU-NEXT: push {r4, lr}
+; GNU-NEXT: sub sp, #8
+; GNU-NEXT: bl __gnu_h2f_ieee
+; GNU-NEXT: add r1, sp, #4
+; GNU-NEXT: mov r2, sp
+; GNU-NEXT: bl sincosf
+; GNU-NEXT: ldr r0, [sp, #4]
+; GNU-NEXT: bl __gnu_f2h_ieee
+; GNU-NEXT: mov r4, r0
+; GNU-NEXT: ldr r0, [sp]
+; GNU-NEXT: bl __gnu_f2h_ieee
+; GNU-NEXT: mov r1, r0
+; GNU-NEXT: mov r0, r4
+; GNU-NEXT: add sp, #8
+; GNU-NEXT: pop {r4, pc}
+;
+; GNUEABI-LABEL: test_sincos_f16:
+; GNUEABI: @ %bb.0:
+; GNUEABI-NEXT: .save {r4, lr}
+; GNUEABI-NEXT: push {r4, lr}
+; GNUEABI-NEXT: .pad #8
+; GNUEABI-NEXT: sub sp, sp, #8
+; GNUEABI-NEXT: bl __gnu_h2f_ieee
+; GNUEABI-NEXT: add r1, sp, #4
+; GNUEABI-NEXT: mov r2, sp
+; GNUEABI-NEXT: bl sincosf
+; GNUEABI-NEXT: ldr r0, [sp, #4]
+; GNUEABI-NEXT: bl __gnu_f2h_ieee
+; GNUEABI-NEXT: mov r4, r0
+; GNUEABI-NEXT: ldr r0, [sp]
+; GNUEABI-NEXT: bl __gnu_f2h_ieee
+; GNUEABI-NEXT: mov r1, r0
+; GNUEABI-NEXT: mov r0, r4
+; GNUEABI-NEXT: add sp, sp, #8
+; GNUEABI-NEXT: pop {r4, pc}
+;
+; IOS-NO-STRET-LABEL: test_sincos_f16:
+; IOS-NO-STRET: @ %bb.0:
+; IOS-NO-STRET-NEXT: push {r4, r5, lr}
+; IOS-NO-STRET-NEXT: bl ___extendhfsf2
+; IOS-NO-STRET-NEXT: mov r4, r0
+; IOS-NO-STRET-NEXT: bl _sinf
+; IOS-NO-STRET-NEXT: bl ___truncsfhf2
+; IOS-NO-STRET-NEXT: mov r5, r0
+; IOS-NO-STRET-NEXT: mov r0, r4
+; IOS-NO-STRET-NEXT: bl _cosf
+; IOS-NO-STRET-NEXT: bl ___truncsfhf2
+; IOS-NO-STRET-NEXT: mov r1, r0
+; IOS-NO-STRET-NEXT: mov r0, r5
+; IOS-NO-STRET-NEXT: pop {r4, r5, pc}
+;
+; IOS-WITH-STRET-LABEL: test_sincos_f16:
+; IOS-WITH-STRET: @ %bb.0:
+; IOS-WITH-STRET-NEXT: push {r4, r5, lr}
+; IOS-WITH-STRET-NEXT: sub sp, sp, #8
+; IOS-WITH-STRET-NEXT: bl ___extendhfsf2
+; IOS-WITH-STRET-NEXT: mov r1, r0
+; IOS-WITH-STRET-NEXT: mov r0, sp
+; IOS-WITH-STRET-NEXT: bl ___sincosf_stret
+; IOS-WITH-STRET-NEXT: ldm sp, {r0, r4}
+; IOS-WITH-STRET-NEXT: bl ___truncsfhf2
+; IOS-WITH-STRET-NEXT: mov r5, r0
+; IOS-WITH-STRET-NEXT: mov r0, r4
+; IOS-WITH-STRET-NEXT: bl ___truncsfhf2
+; IOS-WITH-STRET-NEXT: mov r1, r0
+; IOS-WITH-STRET-NEXT: mov r0, r5
+; IOS-WITH-STRET-NEXT: add sp, sp, #8
+; IOS-WITH-STRET-NEXT: pop {r4, r5, pc}
%result = call { half, half } @llvm.sincos.f16(half %a)
ret { half, half } %result
}
define half @test_sincos_f16_only_use_sin(half %a) {
-; CHECK-LABEL: test_sincos_f16_only_use_sin:
-; CHECK: @ %bb.0:
-; CHECK-NEXT: push {r7, lr}
-; CHECK-NEXT: sub sp, #8
-; CHECK-NEXT: bl __gnu_h2f_ieee
-; CHECK-NEXT: add r1, sp, #4
-; CHECK-NEXT: mov r2, sp
-; CHECK-NEXT: bl sincosf
-; CHECK-NEXT: ldr r0, [sp, #4]
-; CHECK-NEXT: bl __gnu_f2h_ieee
-; CHECK-NEXT: add sp, #8
-; CHECK-NEXT: pop {r7, pc}
+; GNU-LABEL: test_sincos_f16_only_use_sin:
+; GNU: @ %bb.0:
+; GNU-NEXT: push {r7, lr}
+; GNU-NEXT: sub sp, #8
+; GNU-NEXT: bl __gnu_h2f_ieee
+; GNU-NEXT: add r1, sp, #4
+; GNU-NEXT: mov r2, sp
+; GNU-NEXT: bl sincosf
+; GNU-NEXT: ldr r0, [sp, #4]
+; GNU-NEXT: bl __gnu_f2h_ieee
+; GNU-NEXT: add sp, #8
+; GNU-NEXT: pop {r7, pc}
+;
+; GNUEABI-LABEL: test_sincos_f16_only_use_sin:
+; GNUEABI: @ %bb.0:
+; GNUEABI-NEXT: .save {r11, lr}
+; GNUEABI-NEXT: push {r11, lr}
+; GNUEABI-NEXT: .pad #8
+; GNUEABI-NEXT: sub sp, sp, #8
+; GNUEABI-NEXT: bl __gnu_h2f_ieee
+; GNUEABI-NEXT: add r1, sp, #4
+; GNUEABI-NEXT: mov r2, sp
+; GNUEABI-NEXT: bl sincosf
+; GNUEABI-NEXT: ldr r0, [sp, #4]
+; GNUEABI-NEXT: bl __gnu_f2h_ieee
+; GNUEABI-NEXT: add sp, sp, #8
+; GNUEABI-NEXT: pop {r11, pc}
+;
+; IOS-NO-STRET-LABEL: test_sincos_f16_only_use_sin:
+; IOS-NO-STRET: @ %bb.0:
+; IOS-NO-STRET-NEXT: push {lr}
+; IOS-NO-STRET-NEXT: bl ___extendhfsf2
+; IOS-NO-STRET-NEXT: bl _sinf
+; IOS-NO-STRET-NEXT: bl ___truncsfhf2
+; IOS-NO-STRET-NEXT: pop {lr}
+; IOS-NO-STRET-NEXT: bx lr
+;
+; IOS-WITH-STRET-LABEL: test_sincos_f16_only_use_sin:
+; IOS-WITH-STRET: @ %bb.0:
+; IOS-WITH-STRET-NEXT: push {lr}
+; IOS-WITH-STRET-NEXT: sub sp, sp, #8
+; IOS-WITH-STRET-NEXT: bl ___extendhfsf2
+; IOS-WITH-STRET-NEXT: mov r1, r0
+; IOS-WITH-STRET-NEXT: mov r0, sp
+; IOS-WITH-STRET-NEXT: bl ___sincosf_stret
+; IOS-WITH-STRET-NEXT: ldr r0, [sp]
+; IOS-WITH-STRET-NEXT: bl ___truncsfhf2
+; IOS-WITH-STRET-NEXT: add sp, sp, #8
+; IOS-WITH-STRET-NEXT: pop {lr}
+; IOS-WITH-STRET-NEXT: bx lr
%result = call { half, half } @llvm.sincos.f16(half %a)
%result.0 = extractvalue { half, half } %result, 0
ret half %result.0
}
define half @test_sincos_f16_only_use_cos(half %a) {
-; CHECK-LABEL: test_sincos_f16_only_use_cos:
-; CHECK: @ %bb.0:
-; CHECK-NEXT: push {r7, lr}
-; CHECK-NEXT: sub sp, #8
-; CHECK-NEXT: bl __gnu_h2f_ieee
-; CHECK-NEXT: add r1, sp, #4
-; CHECK-NEXT: mov r2, sp
-; CHECK-NEXT: bl sincosf
-; CHECK-NEXT: ldr r0, [sp]
-; CHECK-NEXT: bl __gnu_f2h_ieee
-; CHECK-NEXT: add sp, #8
-; CHECK-NEXT: pop {r7, pc}
+; GNU-LABEL: test_sincos_f16_only_use_cos:
+; GNU: @ %bb.0:
+; GNU-NEXT: push {r7, lr}
+; GNU-NEXT: sub sp, #8
+; GNU-NEXT: bl __gnu_h2f_ieee
+; GNU-NEXT: add r1, sp, #4
+; GNU-NEXT: mov r2, sp
+; GNU-NEXT: bl sincosf
+; GNU-NEXT: ldr r0, [sp]
+; GNU-NEXT: bl __gnu_f2h_ieee
+; GNU-NEXT: add sp, #8
+; GNU-NEXT: pop {r7, pc}
+;
+; GNUEABI-LABEL: test_sincos_f16_only_use_cos:
+; GNUEABI: @ %bb.0:
+; GNUEABI-NEXT: .save {r11, lr}
+; GNUEABI-NEXT: push {r11, lr}
+; GNUEABI-NEXT: .pad #8
+; GNUEABI-NEXT: sub sp, sp, #8
+; GNUEABI-NEXT: bl __gnu_h2f_ieee
+; GNUEABI-NEXT: add r1, sp, #4
+; GNUEABI-NEXT: mov r2, sp
+; GNUEABI-NEXT: bl sincosf
+; GNUEABI-NEXT: ldr r0, [sp]
+; GNUEABI-NEXT: bl __gnu_f2h_ieee
+; GNUEABI-NEXT: add sp, sp, #8
+; GNUEABI-NEXT: pop {r11, pc}
+;
+; IOS-NO-STRET-LABEL: test_sincos_f16_only_use_cos:
+; IOS-NO-STRET: @ %bb.0:
+; IOS-NO-STRET-NEXT: push {lr}
+; IOS-NO-STRET-NEXT: bl ___extendhfsf2
+; IOS-NO-STRET-NEXT: bl _cosf
+; IOS-NO-STRET-NEXT: bl ___truncsfhf2
+; IOS-NO-STRET-NEXT: pop {lr}
+; IOS-NO-STRET-NEXT: bx lr
+;
+; IOS-WITH-STRET-LABEL: test_sincos_f16_only_use_cos:
+; IOS-WITH-STRET: @ %bb.0:
+; IOS-WITH-STRET-NEXT: push {lr}
+; IOS-WITH-STRET-NEXT: sub sp, sp, #8
+; IOS-WITH-STRET-NEXT: bl ___extendhfsf2
+; IOS-WITH-STRET-NEXT: mov r1, r0
+; IOS-WITH-STRET-NEXT: mov r0, sp
+; IOS-WITH-STRET-NEXT: bl ___sincosf_stret
+; IOS-WITH-STRET-NEXT: ldr r0, [sp, #4]
+; IOS-WITH-STRET-NEXT: bl ___truncsfhf2
+; IOS-WITH-STRET-NEXT: add sp, sp, #8
+; IOS-WITH-STRET-NEXT: pop {lr}
+; IOS-WITH-STRET-NEXT: bx lr
%result = call { half, half } @llvm.sincos.f16(half %a)
%result.1 = extractvalue { half, half } %result, 1
ret half %result.1
}
define { <2 x half>, <2 x half> } @test_sincos_v2f16(<2 x half> %a) {
-; CHECK-LABEL: test_sincos_v2f16:
-; CHECK: @ %bb.0:
-; CHECK-NEXT: push {r4, lr}
-; CHECK-NEXT: vpush {d8}
-; CHECK-NEXT: sub sp, #24
-; CHECK-NEXT: mov r4, r0
-; CHECK-NEXT: mov r0, r1
-; CHECK-NEXT: bl __gnu_h2f_ieee
-; CHECK-NEXT: add r1, sp, #12
-; CHECK-NEXT: add r2, sp, #8
-; CHECK-NEXT: bl sincosf
-; CHECK-NEXT: mov r0, r4
-; CHECK-NEXT: bl __gnu_h2f_ieee
-; CHECK-NEXT: add r1, sp, #4
-; CHECK-NEXT: mov r2, sp
-; CHECK-NEXT: bl sincosf
-; CHECK-NEXT: ldr r0, [sp, #12]
-; CHECK-NEXT: bl __gnu_f2h_ieee
-; CHECK-NEXT: ldr r1, [sp, #4]
-; CHECK-NEXT: strh.w r0, [sp, #22]
-; CHECK-NEXT: mov r0, r1
-; CHECK-NEXT: bl __gnu_f2h_ieee
-; CHECK-NEXT: strh.w r0, [sp, #20]
-; CHECK-NEXT: add r0, sp, #20
-; CHECK-NEXT: vld1.32 {d8[0]}, [r0:32]
-; CHECK-NEXT: ldr r0, [sp, #8]
-; CHECK-NEXT: bl __gnu_f2h_ieee
-; CHECK-NEXT: ldr r1, [sp]
-; CHECK-NEXT: strh.w r0, [sp, #18]
-; CHECK-NEXT: mov r0, r1
-; CHECK-NEXT: bl __gnu_f2h_ieee
-; CHECK-NEXT: strh.w r0, [sp, #16]
-; CHECK-NEXT: add r0, sp, #16
-; CHECK-NEXT: vmovl.u16 q9, d8
-; CHECK-NEXT: vld1.32 {d16[0]}, [r0:32]
-; CHECK-NEXT: vmovl.u16 q8, d16
-; CHECK-NEXT: vmov.32 r0, d18[0]
-; CHECK-NEXT: vmov.32 r1, d18[1]
-; CHECK-NEXT: vmov.32 r2, d16[0]
-; CHECK-NEXT: vmov.32 r3, d16[1]
-; CHECK-NEXT: add sp, #24
-; CHECK-NEXT: vpop {d8}
-; CHECK-NEXT: pop {r4, pc}
+; GNU-LABEL: test_sincos_v2f16:
+; GNU: @ %bb.0:
+; GNU-NEXT: push {r4, lr}
+; GNU-NEXT: vpush {d8}
+; GNU-NEXT: sub sp, #24
+; GNU-NEXT: mov r4, r0
+; GNU-NEXT: mov r0, r1
+; GNU-NEXT: bl __gnu_h2f_ieee
+; GNU-NEXT: add r1, sp, #12
+; GNU-NEXT: add r2, sp, #8
+; GNU-NEXT: bl sincosf
+; GNU-NEXT: mov r0, r4
+; GNU-NEXT: bl __gnu_h2f_ieee
+; GNU-NEXT: add r1, sp, #4
+; GNU-NEXT: mov r2, sp
+; GNU-NEXT: bl sincosf
+; GNU-NEXT: ldr r0, [sp, #12]
+; GNU-NEXT: bl __gnu_f2h_ieee
+; GNU-NEXT: ldr r1, [sp, #4]
+; GNU-NEXT: strh.w r0, [sp, #22]
+; GNU-NEXT: mov r0, r1
+; GNU-NEXT: bl __gnu_f2h_ieee
+; GNU-NEXT: strh.w r0, [sp, #20]
+; GNU-NEXT: add r0, sp, #20
+; GNU-NEXT: vld1.32 {d8[0]}, [r0:32]
+; GNU-NEXT: ldr r0, [sp, #8]
+; GNU-NEXT: bl __gnu_f2h_ieee
+; GNU-NEXT: ldr r1, [sp]
+; GNU-NEXT: strh.w r0, [sp, #18]
+; GNU-NEXT: mov r0, r1
+; GNU-NEXT: bl __gnu_f2h_ieee
+; GNU-NEXT: strh.w r0, [sp, #16]
+; GNU-NEXT: add r0, sp, #16
+; GNU-NEXT: vmovl.u16 q9, d8
+; GNU-NEXT: vld1.32 {d16[0]}, [r0:32]
+; GNU-NEXT: vmovl.u16 q8, d16
+; GNU-NEXT: vmov.32 r0, d18[0]
+; GNU-NEXT: vmov.32 r1, d18[1]
+; GNU-NEXT: vmov.32 r2, d16[0]
+; GNU-NEXT: vmov.32 r3, d16[1]
+; GNU-NEXT: add sp, #24
+; GNU-NEXT: vpop {d8}
+; GNU-NEXT: pop {r4, pc}
+;
+; GNUEABI-LABEL: test_sincos_v2f16:
+; GNUEABI: @ %bb.0:
+; GNUEABI-NEXT: .save {r4, lr}
+; GNUEABI-NEXT: push {r4, lr}
+; GNUEABI-NEXT: .vsave {d8}
+; GNUEABI-NEXT: vpush {d8}
+; GNUEABI-NEXT: .pad #24
+; GNUEABI-NEXT: sub sp, sp, #24
+; GNUEABI-NEXT: mov r4, r0
+; GNUEABI-NEXT: mov r0, r1
+; GNUEABI-NEXT: bl __gnu_h2f_ieee
+; GNUEABI-NEXT: add r1, sp, #12
+; GNUEABI-NEXT: add r2, sp, #8
+; GNUEABI-NEXT: bl sincosf
+; GNUEABI-NEXT: mov r0, r4
+; GNUEABI-NEXT: bl __gnu_h2f_ieee
+; GNUEABI-NEXT: add r1, sp, #4
+; GNUEABI-NEXT: mov r2, sp
+; GNUEABI-NEXT: bl sincosf
+; GNUEABI-NEXT: ldr r0, [sp, #12]
+; GNUEABI-NEXT: bl __gnu_f2h_ieee
+; GNUEABI-NEXT: ldr r1, [sp, #4]
+; GNUEABI-NEXT: strh r0, [sp, #22]
+; GNUEABI-NEXT: mov r0, r1
+; GNUEABI-NEXT: bl __gnu_f2h_ieee
+; GNUEABI-NEXT: strh r0, [sp, #20]
+; GNUEABI-NEXT: add r0, sp, #20
+; GNUEABI-NEXT: vld1.32 {d8[0]}, [r0:32]
+; GNUEABI-NEXT: ldr r0, [sp, #8]
+; GNUEABI-NEXT: bl __gnu_f2h_ieee
+; GNUEABI-NEXT: ldr r1, [sp]
+; GNUEABI-NEXT: strh r0, [sp, #18]
+; GNUEABI-NEXT: mov r0, r1
+; GNUEABI-NEXT: bl __gnu_f2h_ieee
+; GNUEABI-NEXT: strh r0, [sp, #16]
+; GNUEABI-NEXT: add r0, sp, #16
+; GNUEABI-NEXT: vmovl.u16 q9, d8
+; GNUEABI-NEXT: vld1.32 {d16[0]}, [r0:32]
+; GNUEABI-NEXT: vmovl.u16 q8, d16
+; GNUEABI-NEXT: vmov.32 r0, d18[0]
+; GNUEABI-NEXT: vmov.32 r1, d18[1]
+; GNUEABI-NEXT: vmov.32 r2, d16[0]
+; GNUEABI-NEXT: vmov.32 r3, d16[1]
+; GNUEABI-NEXT: add sp, sp, #24
+; GNUEABI-NEXT: vpop {d8}
+; GNUEABI-NEXT: pop {r4, pc}
+;
+; IOS-NO-STRET-LABEL: test_sincos_v2f16:
+; IOS-NO-STRET: @ %bb.0:
+; IOS-NO-STRET-NEXT: push {r4, r5, lr}
+; IOS-NO-STRET-NEXT: vpush {d8}
+; IOS-NO-STRET-NEXT: sub sp, sp, #8
+; IOS-NO-STRET-NEXT: mov r5, r0
+; IOS-NO-STRET-NEXT: mov r0, r1
+; IOS-NO-STRET-NEXT: bl ___extendhfsf2
+; IOS-NO-STRET-NEXT: mov r4, r0
+; IOS-NO-STRET-NEXT: bl _sinf
+; IOS-NO-STRET-NEXT: bl ___truncsfhf2
+; IOS-NO-STRET-NEXT: strh r0, [sp, #6]
+; IOS-NO-STRET-NEXT: mov r0, r5
+; IOS-NO-STRET-NEXT: bl ___extendhfsf2
+; IOS-NO-STRET-NEXT: mov r5, r0
+; IOS-NO-STRET-NEXT: bl _sinf
+; IOS-NO-STRET-NEXT: bl ___truncsfhf2
+; IOS-NO-STRET-NEXT: strh r0, [sp, #4]
+; IOS-NO-STRET-NEXT: add r0, sp, #4
+; IOS-NO-STRET-NEXT: vld1.32 {d8[0]}, [r0:32]
+; IOS-NO-STRET-NEXT: mov r0, r4
+; IOS-NO-STRET-NEXT: bl _cosf
+; IOS-NO-STRET-NEXT: bl ___truncsfhf2
+; IOS-NO-STRET-NEXT: strh r0, [sp, #2]
+; IOS-NO-STRET-NEXT: mov r0, r5
+; IOS-NO-STRET-NEXT: bl _cosf
+; IOS-NO-STRET-NEXT: bl ___truncsfhf2
+; IOS-NO-STRET-NEXT: strh r0, [sp]
+; IOS-NO-STRET-NEXT: mov r0, sp
+; IOS-NO-STRET-NEXT: vld1.32 {d16[0]}, [r0:32]
+; IOS-NO-STRET-NEXT: vmovl.u16 q9, d8
+; IOS-NO-STRET-NEXT: vmovl.u16 q8, d16
+; IOS-NO-STRET-NEXT: vmov.32 r0, d18[0]
+; IOS-NO-STRET-NEXT: vmov.32 r1, d18[1]
+; IOS-NO-STRET-NEXT: vmov.32 r2, d16[0]
+; IOS-NO-STRET-NEXT: vmov.32 r3, d16[1]
+; IOS-NO-STRET-NEXT: add sp, sp, #8
+; IOS-NO-STRET-NEXT: vpop {d8}
+; IOS-NO-STRET-NEXT: pop {r4, r5, pc}
+;
+; IOS-WITH-STRET-LABEL: test_sincos_v2f16:
+; IOS-WITH-STRET: @ %bb.0:
+; IOS-WITH-STRET-NEXT: push {r4, r5, lr}
+; IOS-WITH-STRET-NEXT: vpush {d8}
+; IOS-WITH-STRET-NEXT: sub sp, sp, #24
+; IOS-WITH-STRET-NEXT: mov r4, r0
+; IOS-WITH-STRET-NEXT: mov r0, r1
+; IOS-WITH-STRET-NEXT: bl ___extendhfsf2
+; IOS-WITH-STRET-NEXT: mov r1, r0
+; IOS-WITH-STRET-NEXT: add r0, sp, #8
+; IOS-WITH-STRET-NEXT: bl ___sincosf_stret
+; IOS-WITH-STRET-NEXT: mov r0, r4
+; IOS-WITH-STRET-NEXT: bl ___extendhfsf2
+; IOS-WITH-STRET-NEXT: mov r1, r0
+; IOS-WITH-STRET-NEXT: mov r0, sp
+; IOS-WITH-STRET-NEXT: bl ___sincosf_stret
+; IOS-WITH-STRET-NEXT: ldr r0, [sp, #8]
+; IOS-WITH-STRET-NEXT: ldr r4, [sp, #12]
+; IOS-WITH-STRET-NEXT: bl ___truncsfhf2
+; IOS-WITH-STRET-NEXT: ldm sp, {r1, r5}
+; IOS-WITH-STRET-NEXT: strh r0, [sp, #22]
+; IOS-WITH-STRET-NEXT: mov r0, r1
+; IOS-WITH-STRET-NEXT: bl ___truncsfhf2
+; IOS-WITH-STRET-NEXT: strh r0, [sp, #20]
+; IOS-WITH-STRET-NEXT: add r0, sp, #20
+; IOS-WITH-STRET-NEXT: vld1.32 {d8[0]}, [r0:32]
+; IOS-WITH-STRET-NEXT: mov r0, r4
+; IOS-WITH-STRET-NEXT: bl ___truncsfhf2
+; IOS-WITH-STRET-NEXT: strh r0, [sp, #18]
+; IOS-WITH-STRET-NEXT: mov r0, r5
+; IOS-WITH-STRET-NEXT: bl ___truncsfhf2
+; IOS-WITH-STRET-NEXT: strh r0, [sp, #16]
+; IOS-WITH-STRET-NEXT: add r0, sp, #16
+; IOS-WITH-STRET-NEXT: vmovl.u16 q9, d8
+; IOS-WITH-STRET-NEXT: vld1.32 {d16[0]}, [r0:32]
+; IOS-WITH-STRET-NEXT: vmovl.u16 q8, d16
+; IOS-WITH-STRET-NEXT: vmov.32 r0, d18[0]
+; IOS-WITH-STRET-NEXT: vmov.32 r1, d18[1]
+; IOS-WITH-STRET-NEXT: vmov.32 r2, d16[0]
+; IOS-WITH-STRET-NEXT: vmov.32 r3, d16[1]
+; IOS-WITH-STRET-NEXT: add sp, sp, #24
+; IOS-WITH-STRET-NEXT: vpop {d8}
+; IOS-WITH-STRET-NEXT: pop {r4, r5, pc}
%result = call { <2 x half>, <2 x half> } @llvm.sincos.v2f16(<2 x half> %a)
ret { <2 x half>, <2 x half> } %result
}
define { float, float } @test_sincos_f32(float %a) {
-; CHECK-LABEL: test_sincos_f32:
-; CHECK: @ %bb.0:
-; CHECK-NEXT: push {r7, lr}
-; CHECK-NEXT: sub sp, #8
-; CHECK-NEXT: add r1, sp, #4
-; CHECK-NEXT: mov r2, sp
-; CHECK-NEXT: bl sincosf
-; CHECK-NEXT: ldrd r1, r0, [sp], #8
-; CHECK-NEXT: pop {r7, pc}
+; GNU-LABEL: test_sincos_f32:
+; GNU: @ %bb.0:
+; GNU-NEXT: push {r7, lr}
+; GNU-NEXT: sub sp, #8
+; GNU-NEXT: add r1, sp, #4
+; GNU-NEXT: mov r2, sp
+; GNU-NEXT: bl sincosf
+; GNU-NEXT: ldrd r1, r0, [sp], #8
+; GNU-NEXT: pop {r7, pc}
+;
+; GNUEABI-LABEL: test_sincos_f32:
+; GNUEABI: @ %bb.0:
+; GNUEABI-NEXT: .save {r11, lr}
+; GNUEABI-NEXT: push {r11, lr}
+; GNUEABI-NEXT: .pad #8
+; GNUEABI-NEXT: sub sp, sp, #8
+; GNUEABI-NEXT: add r1, sp, #4
+; GNUEABI-NEXT: mov r2, sp
+; GNUEABI-NEXT: bl sincosf
+; GNUEABI-NEXT: ldr r0, [sp, #4]
+; GNUEABI-NEXT: ldr r1, [sp], #8
+; GNUEABI-NEXT: pop {r11, pc}
+;
+; IOS-NO-STRET-LABEL: test_sincos_f32:
+; IOS-NO-STRET: @ %bb.0:
+; IOS-NO-STRET-NEXT: push {r4, r5, lr}
+; IOS-NO-STRET-NEXT: mov r4, r0
+; IOS-NO-STRET-NEXT: bl _sinf
+; IOS-NO-STRET-NEXT: mov r5, r0
+; IOS-NO-STRET-NEXT: mov r0, r4
+; IOS-NO-STRET-NEXT: bl _cosf
+; IOS-NO-STRET-NEXT: mov r1, r0
+; IOS-NO-STRET-NEXT: mov r0, r5
+; IOS-NO-STRET-NEXT: pop {r4, r5, pc}
+;
+; IOS-WITH-STRET-LABEL: test_sincos_f32:
+; IOS-WITH-STRET: @ %bb.0:
+; IOS-WITH-STRET-NEXT: push {lr}
+; IOS-WITH-STRET-NEXT: sub sp, sp, #8
+; IOS-WITH-STRET-NEXT: mov r1, r0
+; IOS-WITH-STRET-NEXT: mov r0, sp
+; IOS-WITH-STRET-NEXT: bl ___sincosf_stret
+; IOS-WITH-STRET-NEXT: pop {r0, r1}
+; IOS-WITH-STRET-NEXT: pop {lr}
+; IOS-WITH-STRET-NEXT: bx lr
%result = call { float, float } @llvm.sincos.f32(float %a)
ret { float, float } %result
}
define { <2 x float>, <2 x float> } @test_sincos_v2f32(<2 x float> %a) {
-; CHECK-LABEL: test_sincos_v2f32:
-; CHECK: @ %bb.0:
-; CHECK-NEXT: push {r7, lr}
-; CHECK-NEXT: vpush {d8}
-; CHECK-NEXT: sub sp, #16
-; CHECK-NEXT: vmov d8, r0, r1
-; CHECK-NEXT: add r1, sp, #4
-; CHECK-NEXT: mov r2, sp
-; CHECK-NEXT: vmov r0, s17
-; CHECK-NEXT: bl sincosf
-; CHECK-NEXT: vmov r0, s16
-; CHECK-NEXT: add r1, sp, #12
-; CHECK-NEXT: add r2, sp, #8
-; CHECK-NEXT: bl sincosf
-; CHECK-NEXT: vldr s1, [sp, #4]
-; CHECK-NEXT: vldr s3, [sp]
-; CHECK-NEXT: vldr s0, [sp, #12]
-; CHECK-NEXT: vldr s2, [sp, #8]
-; CHECK-NEXT: vmov r0, r1, d0
-; CHECK-NEXT: vmov r2, r3, d1
-; CHECK-NEXT: add sp, #16
-; CHECK-NEXT: vpop {d8}
-; CHECK-NEXT: pop {r7, pc}
+; GNU-LABEL: test_sincos_v2f32:
+; GNU: @ %bb.0:
+; GNU-NEXT: push {r7, lr}
+; GNU-NEXT: vpush {d8}
+; GNU-NEXT: sub sp, #16
+; GNU-NEXT: vmov d8, r0, r1
+; GNU-NEXT: add r1, sp, #4
+; GNU-NEXT: mov r2, sp
+; GNU-NEXT: vmov r0, s17
+; GNU-NEXT: bl sincosf
+; GNU-NEXT: vmov r0, s16
+; GNU-NEXT: add r1, sp, #12
+; GNU-NEXT: add r2, sp, #8
+; GNU-NEXT: bl sincosf
+; GNU-NEXT: vldr s1, [sp, #4]
+; GNU-NEXT: vldr s3, [sp]
+; GNU-NEXT: vldr s0, [sp, #12]
+; GNU-NEXT: vldr s2, [sp, #8]
+; GNU-NEXT: vmov r0, r1, d0
+; GNU-NEXT: vmov r2, r3, d1
+; GNU-NEXT: add sp, #16
+; GNU-NEXT: vpop {d8}
+; GNU-NEXT: pop {r7, pc}
+;
+; GNUEABI-LABEL: test_sincos_v2f32:
+; GNUEABI: @ %bb.0:
+; GNUEABI-NEXT: .save {r11, lr}
+; GNUEABI-NEXT: push {r11, lr}
+; GNUEABI-NEXT: .vsave {d8}
+; GNUEABI-NEXT: vpush {d8}
+; GNUEABI-NEXT: .pad #16
+; GNUEABI-NEXT: sub sp, sp, #16
+; GNUEABI-NEXT: vmov d8, r0, r1
+; GNUEABI-NEXT: add r1, sp, #4
+; GNUEABI-NEXT: mov r2, sp
+; GNUEABI-NEXT: vmov r0, s17
+; GNUEABI-NEXT: bl sincosf
+; GNUEABI-NEXT: vmov r0, s16
+; GNUEABI-NEXT: add r1, sp, #12
+; GNUEABI-NEXT: add r2, sp, #8
+; GNUEABI-NEXT: bl sincosf
+; GNUEABI-NEXT: vldr...
[truncated]
|
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Add this suggestion to a batch that can be applied as a single commit.
This suggestion is invalid because no changes were made to the code.
Suggestions cannot be applied while the pull request is closed.
Suggestions cannot be applied while viewing a subset of changes.
Only one suggestion per line can be applied in a batch.
Add this suggestion to a batch that can be applied as a single commit.
Applying suggestions on deleted lines is not supported.
You must change the existing code in this line in order to create a valid suggestion.
Outdated suggestions cannot be applied.
This suggestion has been applied or marked resolved.
Suggestions cannot be applied from pending reviews.
Suggestions cannot be applied on multi-line comments.
Suggestions cannot be applied while the pull request is queued to merge.
Suggestion cannot be applied right now. Please check back later.

Make sure the iOS configurations both with and without sincos_stret are tested.