diff --git a/llvm/test/CodeGen/AArch64/neon-extadd-extract.ll b/llvm/test/CodeGen/AArch64/neon-extadd-extract.ll new file mode 100644 index 0000000000000..4fff9862b4950 --- /dev/null +++ b/llvm/test/CodeGen/AArch64/neon-extadd-extract.ll @@ -0,0 +1,538 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2 +; RUN: llc < %s -mtriple aarch64-none-eabi -o - | FileCheck %s + +define <4 x i16> @addls_v8i8_0(<8 x i8> %s0, <8 x i8> %s1) { +; CHECK-LABEL: addls_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.8h, v0.8b, #0 +; CHECK-NEXT: sshll v1.8h, v1.8b, #0 +; CHECK-NEXT: add v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s0s = sext <8 x i8> %s0 to <8 x i16> + %s1s = sext <8 x i8> %s1 to <8 x i16> + %t0 = shufflevector <8 x i16> %s0s, <8 x i16> poison, <4 x i32> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = add <4 x i16> %t0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @addws_v8i8_0(<4 x i16> %s0, <8 x i8> %s1) { +; CHECK-LABEL: addws_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.8h, v1.8b, #0 +; CHECK-NEXT: add v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s1s = sext <8 x i8> %s1 to <8 x i16> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = add <4 x i16> %s0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @addlu_v8i8_0(<8 x i8> %s0, <8 x i8> %s1) { +; CHECK-LABEL: addlu_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.8h, v0.8b, #0 +; CHECK-NEXT: ushll v1.8h, v1.8b, #0 +; CHECK-NEXT: add v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s0s = zext <8 x i8> %s0 to <8 x i16> + %s1s = zext <8 x i8> %s1 to <8 x i16> + %t0 = shufflevector <8 x i16> %s0s, <8 x i16> poison, <4 x i32> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = add <4 x i16> %t0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @addwu_v8i8_0(<4 x i16> %s0, <8 x i8> %s1) { +; CHECK-LABEL: addwu_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.8h, v1.8b, #0 +; CHECK-NEXT: add v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s1s = zext <8 x i8> %s1 to <8 x i16> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = add <4 x i16> %s0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @subls_v8i8_0(<8 x i8> %s0, <8 x i8> %s1) { +; CHECK-LABEL: subls_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.8h, v0.8b, #0 +; CHECK-NEXT: sshll v1.8h, v1.8b, #0 +; CHECK-NEXT: sub v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s0s = sext <8 x i8> %s0 to <8 x i16> + %s1s = sext <8 x i8> %s1 to <8 x i16> + %t0 = shufflevector <8 x i16> %s0s, <8 x i16> poison, <4 x i32> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = sub <4 x i16> %t0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @subws_v8i8_0(<4 x i16> %s0, <8 x i8> %s1) { +; CHECK-LABEL: subws_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.8h, v1.8b, #0 +; CHECK-NEXT: sub v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s1s = sext <8 x i8> %s1 to <8 x i16> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = sub <4 x i16> %s0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @sublu_v8i8_0(<8 x i8> %s0, <8 x i8> %s1) { +; CHECK-LABEL: sublu_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.8h, v0.8b, #0 +; CHECK-NEXT: ushll v1.8h, v1.8b, #0 +; CHECK-NEXT: sub v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s0s = zext <8 x i8> %s0 to <8 x i16> + %s1s = zext <8 x i8> %s1 to <8 x i16> + %t0 = shufflevector <8 x i16> %s0s, <8 x i16> poison, <4 x i32> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = sub <4 x i16> %t0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @subwu_v8i8_0(<4 x i16> %s0, <8 x i8> %s1) { +; CHECK-LABEL: subwu_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.8h, v1.8b, #0 +; CHECK-NEXT: sub v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s1s = zext <8 x i8> %s1 to <8 x i16> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = sub <4 x i16> %s0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @mulls_v8i8_0(<8 x i8> %s0, <8 x i8> %s1) { +; CHECK-LABEL: mulls_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.8h, v0.8b, #0 +; CHECK-NEXT: sshll v1.8h, v1.8b, #0 +; CHECK-NEXT: mul v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s0s = sext <8 x i8> %s0 to <8 x i16> + %s1s = sext <8 x i8> %s1 to <8 x i16> + %t0 = shufflevector <8 x i16> %s0s, <8 x i16> poison, <4 x i32> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = mul <4 x i16> %t0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @mulws_v8i8_0(<4 x i16> %s0, <8 x i8> %s1) { +; CHECK-LABEL: mulws_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.8h, v1.8b, #0 +; CHECK-NEXT: mul v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s1s = sext <8 x i8> %s1 to <8 x i16> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = mul <4 x i16> %s0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @mullu_v8i8_0(<8 x i8> %s0, <8 x i8> %s1) { +; CHECK-LABEL: mullu_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.8h, v0.8b, #0 +; CHECK-NEXT: ushll v1.8h, v1.8b, #0 +; CHECK-NEXT: mul v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s0s = zext <8 x i8> %s0 to <8 x i16> + %s1s = zext <8 x i8> %s1 to <8 x i16> + %t0 = shufflevector <8 x i16> %s0s, <8 x i16> poison, <4 x i32> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = mul <4 x i16> %t0, %t1 + ret <4 x i16> %m +} + +define <4 x i16> @mulwu_v8i8_0(<4 x i16> %s0, <8 x i8> %s1) { +; CHECK-LABEL: mulwu_v8i8_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.8h, v1.8b, #0 +; CHECK-NEXT: mul v0.4h, v0.4h, v1.4h +; CHECK-NEXT: ret +entry: + %s1s = zext <8 x i8> %s1 to <8 x i16> + %t1 = shufflevector <8 x i16> %s1s, <8 x i16> poison, <4 x i32> + %m = mul <4 x i16> %s0, %t1 + ret <4 x i16> %m +} + +define <2 x i32> @addls_v4i16_0(<4 x i16> %s0, <4 x i16> %s1) { +; CHECK-LABEL: addls_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.4s, v0.4h, #0 +; CHECK-NEXT: sshll v1.4s, v1.4h, #0 +; CHECK-NEXT: add v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s0s = sext <4 x i16> %s0 to <4 x i32> + %s1s = sext <4 x i16> %s1 to <4 x i32> + %t0 = shufflevector <4 x i32> %s0s, <4 x i32> poison, <2 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = add <2 x i32> %t0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @addws_v4i16_0(<2 x i32> %s0, <4 x i16> %s1) { +; CHECK-LABEL: addws_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.4s, v1.4h, #0 +; CHECK-NEXT: add v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s1s = sext <4 x i16> %s1 to <4 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = add <2 x i32> %s0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @addlu_v4i16_0(<4 x i16> %s0, <4 x i16> %s1) { +; CHECK-LABEL: addlu_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.4s, v0.4h, #0 +; CHECK-NEXT: ushll v1.4s, v1.4h, #0 +; CHECK-NEXT: add v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s0s = zext <4 x i16> %s0 to <4 x i32> + %s1s = zext <4 x i16> %s1 to <4 x i32> + %t0 = shufflevector <4 x i32> %s0s, <4 x i32> poison, <2 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = add <2 x i32> %t0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @addwu_v4i16_0(<2 x i32> %s0, <4 x i16> %s1) { +; CHECK-LABEL: addwu_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.4s, v1.4h, #0 +; CHECK-NEXT: add v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s1s = zext <4 x i16> %s1 to <4 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = add <2 x i32> %s0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @subls_v4i16_0(<4 x i16> %s0, <4 x i16> %s1) { +; CHECK-LABEL: subls_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.4s, v0.4h, #0 +; CHECK-NEXT: sshll v1.4s, v1.4h, #0 +; CHECK-NEXT: sub v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s0s = sext <4 x i16> %s0 to <4 x i32> + %s1s = sext <4 x i16> %s1 to <4 x i32> + %t0 = shufflevector <4 x i32> %s0s, <4 x i32> poison, <2 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = sub <2 x i32> %t0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @subws_v4i16_0(<2 x i32> %s0, <4 x i16> %s1) { +; CHECK-LABEL: subws_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.4s, v1.4h, #0 +; CHECK-NEXT: sub v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s1s = sext <4 x i16> %s1 to <4 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = sub <2 x i32> %s0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @sublu_v4i16_0(<4 x i16> %s0, <4 x i16> %s1) { +; CHECK-LABEL: sublu_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.4s, v0.4h, #0 +; CHECK-NEXT: ushll v1.4s, v1.4h, #0 +; CHECK-NEXT: sub v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s0s = zext <4 x i16> %s0 to <4 x i32> + %s1s = zext <4 x i16> %s1 to <4 x i32> + %t0 = shufflevector <4 x i32> %s0s, <4 x i32> poison, <2 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = sub <2 x i32> %t0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @subwu_v4i16_0(<2 x i32> %s0, <4 x i16> %s1) { +; CHECK-LABEL: subwu_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.4s, v1.4h, #0 +; CHECK-NEXT: sub v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s1s = zext <4 x i16> %s1 to <4 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = sub <2 x i32> %s0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @mulls_v4i16_0(<4 x i16> %s0, <4 x i16> %s1) { +; CHECK-LABEL: mulls_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.4s, v0.4h, #0 +; CHECK-NEXT: sshll v1.4s, v1.4h, #0 +; CHECK-NEXT: mul v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s0s = sext <4 x i16> %s0 to <4 x i32> + %s1s = sext <4 x i16> %s1 to <4 x i32> + %t0 = shufflevector <4 x i32> %s0s, <4 x i32> poison, <2 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = mul <2 x i32> %t0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @mulws_v4i16_0(<2 x i32> %s0, <4 x i16> %s1) { +; CHECK-LABEL: mulws_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.4s, v1.4h, #0 +; CHECK-NEXT: mul v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s1s = sext <4 x i16> %s1 to <4 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = mul <2 x i32> %s0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @mullu_v4i16_0(<4 x i16> %s0, <4 x i16> %s1) { +; CHECK-LABEL: mullu_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.4s, v0.4h, #0 +; CHECK-NEXT: ushll v1.4s, v1.4h, #0 +; CHECK-NEXT: mul v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s0s = zext <4 x i16> %s0 to <4 x i32> + %s1s = zext <4 x i16> %s1 to <4 x i32> + %t0 = shufflevector <4 x i32> %s0s, <4 x i32> poison, <2 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = mul <2 x i32> %t0, %t1 + ret <2 x i32> %m +} + +define <2 x i32> @mulwu_v4i16_0(<2 x i32> %s0, <4 x i16> %s1) { +; CHECK-LABEL: mulwu_v4i16_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.4s, v1.4h, #0 +; CHECK-NEXT: mul v0.2s, v0.2s, v1.2s +; CHECK-NEXT: ret +entry: + %s1s = zext <4 x i16> %s1 to <4 x i32> + %t1 = shufflevector <4 x i32> %s1s, <4 x i32> poison, <2 x i32> + %m = mul <2 x i32> %s0, %t1 + ret <2 x i32> %m +} + +define <1 x i64> @addls_v2i32_0(<2 x i32> %s0, <2 x i32> %s1) { +; CHECK-LABEL: addls_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.2d, v0.2s, #0 +; CHECK-NEXT: sshll v1.2d, v1.2s, #0 +; CHECK-NEXT: add d0, d0, d1 +; CHECK-NEXT: ret +entry: + %s0s = sext <2 x i32> %s0 to <2 x i64> + %s1s = sext <2 x i32> %s1 to <2 x i64> + %t0 = shufflevector <2 x i64> %s0s, <2 x i64> poison, <1 x i32> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = add <1 x i64> %t0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @addws_v2i32_0(<1 x i64> %s0, <2 x i32> %s1) { +; CHECK-LABEL: addws_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.2d, v1.2s, #0 +; CHECK-NEXT: add d0, d0, d1 +; CHECK-NEXT: ret +entry: + %s1s = sext <2 x i32> %s1 to <2 x i64> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = add <1 x i64> %s0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @addlu_v2i32_0(<2 x i32> %s0, <2 x i32> %s1) { +; CHECK-LABEL: addlu_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.2d, v0.2s, #0 +; CHECK-NEXT: ushll v1.2d, v1.2s, #0 +; CHECK-NEXT: add d0, d0, d1 +; CHECK-NEXT: ret +entry: + %s0s = zext <2 x i32> %s0 to <2 x i64> + %s1s = zext <2 x i32> %s1 to <2 x i64> + %t0 = shufflevector <2 x i64> %s0s, <2 x i64> poison, <1 x i32> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = add <1 x i64> %t0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @addwu_v2i32_0(<1 x i64> %s0, <2 x i32> %s1) { +; CHECK-LABEL: addwu_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.2d, v1.2s, #0 +; CHECK-NEXT: add d0, d0, d1 +; CHECK-NEXT: ret +entry: + %s1s = zext <2 x i32> %s1 to <2 x i64> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = add <1 x i64> %s0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @subls_v2i32_0(<2 x i32> %s0, <2 x i32> %s1) { +; CHECK-LABEL: subls_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.2d, v0.2s, #0 +; CHECK-NEXT: sshll v1.2d, v1.2s, #0 +; CHECK-NEXT: sub d0, d0, d1 +; CHECK-NEXT: ret +entry: + %s0s = sext <2 x i32> %s0 to <2 x i64> + %s1s = sext <2 x i32> %s1 to <2 x i64> + %t0 = shufflevector <2 x i64> %s0s, <2 x i64> poison, <1 x i32> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = sub <1 x i64> %t0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @subws_v2i32_0(<1 x i64> %s0, <2 x i32> %s1) { +; CHECK-LABEL: subws_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.2d, v1.2s, #0 +; CHECK-NEXT: sub d0, d0, d1 +; CHECK-NEXT: ret +entry: + %s1s = sext <2 x i32> %s1 to <2 x i64> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = sub <1 x i64> %s0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @sublu_v2i32_0(<2 x i32> %s0, <2 x i32> %s1) { +; CHECK-LABEL: sublu_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.2d, v0.2s, #0 +; CHECK-NEXT: ushll v1.2d, v1.2s, #0 +; CHECK-NEXT: sub d0, d0, d1 +; CHECK-NEXT: ret +entry: + %s0s = zext <2 x i32> %s0 to <2 x i64> + %s1s = zext <2 x i32> %s1 to <2 x i64> + %t0 = shufflevector <2 x i64> %s0s, <2 x i64> poison, <1 x i32> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = sub <1 x i64> %t0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @subwu_v2i32_0(<1 x i64> %s0, <2 x i32> %s1) { +; CHECK-LABEL: subwu_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.2d, v1.2s, #0 +; CHECK-NEXT: sub d0, d0, d1 +; CHECK-NEXT: ret +entry: + %s1s = zext <2 x i32> %s1 to <2 x i64> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = sub <1 x i64> %s0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @mulls_v2i32_0(<2 x i32> %s0, <2 x i32> %s1) { +; CHECK-LABEL: mulls_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v0.2d, v0.2s, #0 +; CHECK-NEXT: sshll v1.2d, v1.2s, #0 +; CHECK-NEXT: fmov x9, d0 +; CHECK-NEXT: fmov x8, d1 +; CHECK-NEXT: smull x8, w9, w8 +; CHECK-NEXT: fmov d0, x8 +; CHECK-NEXT: ret +entry: + %s0s = sext <2 x i32> %s0 to <2 x i64> + %s1s = sext <2 x i32> %s1 to <2 x i64> + %t0 = shufflevector <2 x i64> %s0s, <2 x i64> poison, <1 x i32> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = mul <1 x i64> %t0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @mulws_v2i32_0(<1 x i64> %s0, <2 x i32> %s1) { +; CHECK-LABEL: mulws_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: sshll v1.2d, v1.2s, #0 +; CHECK-NEXT: // kill: def $d0 killed $d0 def $q0 +; CHECK-NEXT: fmov x8, d0 +; CHECK-NEXT: fmov x9, d1 +; CHECK-NEXT: mul x8, x8, x9 +; CHECK-NEXT: fmov d0, x8 +; CHECK-NEXT: ret +entry: + %s1s = sext <2 x i32> %s1 to <2 x i64> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = mul <1 x i64> %s0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @mullu_v2i32_0(<2 x i32> %s0, <2 x i32> %s1) { +; CHECK-LABEL: mullu_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v0.2d, v0.2s, #0 +; CHECK-NEXT: ushll v1.2d, v1.2s, #0 +; CHECK-NEXT: fmov x9, d0 +; CHECK-NEXT: fmov x8, d1 +; CHECK-NEXT: umull x8, w9, w8 +; CHECK-NEXT: fmov d0, x8 +; CHECK-NEXT: ret +entry: + %s0s = zext <2 x i32> %s0 to <2 x i64> + %s1s = zext <2 x i32> %s1 to <2 x i64> + %t0 = shufflevector <2 x i64> %s0s, <2 x i64> poison, <1 x i32> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = mul <1 x i64> %t0, %t1 + ret <1 x i64> %m +} + +define <1 x i64> @mulwu_v2i32_0(<1 x i64> %s0, <2 x i32> %s1) { +; CHECK-LABEL: mulwu_v2i32_0: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: ushll v1.2d, v1.2s, #0 +; CHECK-NEXT: // kill: def $d0 killed $d0 def $q0 +; CHECK-NEXT: fmov x8, d0 +; CHECK-NEXT: fmov x9, d1 +; CHECK-NEXT: mul x8, x8, x9 +; CHECK-NEXT: fmov d0, x8 +; CHECK-NEXT: ret +entry: + %s1s = zext <2 x i32> %s1 to <2 x i64> + %t1 = shufflevector <2 x i64> %s1s, <2 x i64> poison, <1 x i32> + %m = mul <1 x i64> %s0, %t1 + ret <1 x i64> %m +}