diff --git a/llvm/test/CodeGen/X86/bitcast-and-setcc-256.ll b/llvm/test/CodeGen/X86/bitcast-and-setcc-256.ll index 2e6501ef1c772..2ff9dd4d94242 100644 --- a/llvm/test/CodeGen/X86/bitcast-and-setcc-256.ll +++ b/llvm/test/CodeGen/X86/bitcast-and-setcc-256.ll @@ -904,3 +904,93 @@ define i8 @v4i32_concat_undef(<4 x i32> %vec) { %res = bitcast <8 x i1> %insertvec to i8 ret i8 %res } + +define i8 @v2i64_concat_undef(<2 x i64> %vec) { +; SSE2-SSSE3-LABEL: v2i64_concat_undef: +; SSE2-SSSE3: # %bb.0: +; SSE2-SSSE3-NEXT: pxor %xmm1, %xmm1 +; SSE2-SSSE3-NEXT: pcmpeqd %xmm0, %xmm1 +; SSE2-SSSE3-NEXT: pshufd {{.*#+}} xmm0 = xmm1[1,3,3,2] +; SSE2-SSSE3-NEXT: pshufd {{.*#+}} xmm1 = xmm1[0,2,2,3] +; SSE2-SSSE3-NEXT: pand %xmm0, %xmm1 +; SSE2-SSSE3-NEXT: pshuflw {{.*#+}} xmm0 = xmm1[0,2,2,3,4,5,6,7] +; SSE2-SSSE3-NEXT: psllw $15, %xmm0 +; SSE2-SSSE3-NEXT: packsswb %xmm0, %xmm0 +; SSE2-SSSE3-NEXT: pmovmskb %xmm0, %eax +; SSE2-SSSE3-NEXT: # kill: def $al killed $al killed $eax +; SSE2-SSSE3-NEXT: retq +; +; AVX12-LABEL: v2i64_concat_undef: +; AVX12: # %bb.0: +; AVX12-NEXT: vpxor %xmm1, %xmm1, %xmm1 +; AVX12-NEXT: vpcmpeqq %xmm1, %xmm0, %xmm0 +; AVX12-NEXT: vpackssdw %xmm0, %xmm0, %xmm0 +; AVX12-NEXT: vpackssdw %xmm0, %xmm0, %xmm0 +; AVX12-NEXT: vpsllw $15, %xmm0, %xmm0 +; AVX12-NEXT: vpacksswb %xmm0, %xmm0, %xmm0 +; AVX12-NEXT: vpmovmskb %xmm0, %eax +; AVX12-NEXT: # kill: def $al killed $al killed $eax +; AVX12-NEXT: retq +; +; AVX512F-LABEL: v2i64_concat_undef: +; AVX512F: # %bb.0: +; AVX512F-NEXT: vptestnmq %xmm0, %xmm0, %k0 +; AVX512F-NEXT: kmovw %k0, %eax +; AVX512F-NEXT: # kill: def $al killed $al killed $eax +; AVX512F-NEXT: retq +; +; AVX512BW-LABEL: v2i64_concat_undef: +; AVX512BW: # %bb.0: +; AVX512BW-NEXT: vptestnmq %xmm0, %xmm0, %k0 +; AVX512BW-NEXT: kmovd %k0, %eax +; AVX512BW-NEXT: # kill: def $al killed $al killed $eax +; AVX512BW-NEXT: retq + %tobool = icmp eq <2 x i64> %vec, zeroinitializer + %insertvec = shufflevector <2 x i1> %tobool, <2 x i1> poison, <8 x i32> + %res = bitcast <8 x i1> %insertvec to i8 + ret i8 %res +} + +define i8 @v4f64_concat_undef(<4 x double> %vec) { +; SSE2-SSSE3-LABEL: v4f64_concat_undef: +; SSE2-SSSE3: # %bb.0: +; SSE2-SSSE3-NEXT: xorpd %xmm2, %xmm2 +; SSE2-SSSE3-NEXT: xorpd %xmm3, %xmm3 +; SSE2-SSSE3-NEXT: cmpltpd %xmm1, %xmm3 +; SSE2-SSSE3-NEXT: cmpltpd %xmm0, %xmm2 +; SSE2-SSSE3-NEXT: packssdw %xmm3, %xmm2 +; SSE2-SSSE3-NEXT: movmskps %xmm2, %eax +; SSE2-SSSE3-NEXT: # kill: def $al killed $al killed $eax +; SSE2-SSSE3-NEXT: retq +; +; AVX12-LABEL: v4f64_concat_undef: +; AVX12: # %bb.0: +; AVX12-NEXT: vxorpd %xmm1, %xmm1, %xmm1 +; AVX12-NEXT: vcmpltpd %ymm0, %ymm1, %ymm0 +; AVX12-NEXT: vmovmskpd %ymm0, %eax +; AVX12-NEXT: # kill: def $al killed $al killed $eax +; AVX12-NEXT: vzeroupper +; AVX12-NEXT: retq +; +; AVX512F-LABEL: v4f64_concat_undef: +; AVX512F: # %bb.0: +; AVX512F-NEXT: vxorpd %xmm1, %xmm1, %xmm1 +; AVX512F-NEXT: vcmpltpd %ymm0, %ymm1, %k0 +; AVX512F-NEXT: kmovw %k0, %eax +; AVX512F-NEXT: # kill: def $al killed $al killed $eax +; AVX512F-NEXT: vzeroupper +; AVX512F-NEXT: retq +; +; AVX512BW-LABEL: v4f64_concat_undef: +; AVX512BW: # %bb.0: +; AVX512BW-NEXT: vxorpd %xmm1, %xmm1, %xmm1 +; AVX512BW-NEXT: vcmpltpd %ymm0, %ymm1, %k0 +; AVX512BW-NEXT: kmovd %k0, %eax +; AVX512BW-NEXT: # kill: def $al killed $al killed $eax +; AVX512BW-NEXT: vzeroupper +; AVX512BW-NEXT: retq + %tobool = fcmp ogt <4 x double> %vec, zeroinitializer + %insertvec = shufflevector <4 x i1> %tobool, <4 x i1> poison, <8 x i32> + %res = bitcast <8 x i1> %insertvec to i8 + ret i8 %res +}