From 1617756558bc853baacb87ffa9fe7452ba0a3680 Mon Sep 17 00:00:00 2001 From: Simon Pilgrim Date: Fri, 14 Nov 2025 11:27:55 +0000 Subject: [PATCH] [clang][x86] AVX512FP16 constrained sqrt test coverage _mm_sqrt_sh / _mm512_sqrt_ph - these were missed from #167692 --- .../X86/avx512fp16-builtins-constrained.c | 85 +++++++++++++++++++ 1 file changed, 85 insertions(+) create mode 100644 clang/test/CodeGen/X86/avx512fp16-builtins-constrained.c diff --git a/clang/test/CodeGen/X86/avx512fp16-builtins-constrained.c b/clang/test/CodeGen/X86/avx512fp16-builtins-constrained.c new file mode 100644 index 0000000000000..cb029ccdcbf59 --- /dev/null +++ b/clang/test/CodeGen/X86/avx512fp16-builtins-constrained.c @@ -0,0 +1,85 @@ +// REQUIRES: x86-registered-target +// RUN: %clang_cc1 -x c -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -emit-llvm -o - -Wall -Werror | FileCheck %s --check-prefix=UNCONSTRAINED --check-prefix=COMMON +// RUN: %clang_cc1 -x c -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -ffp-exception-behavior=maytrap -DSTRICT=1 -emit-llvm -o - -Wall -Werror | FileCheck %s --check-prefix=CONSTRAINED --check-prefix=COMMON +// RUN: %clang_cc1 -x c -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -S -o - -Wall -Werror | FileCheck %s --check-prefix=CHECK-ASM --check-prefix=COMMON +// RUN: %clang_cc1 -x c -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -ffp-exception-behavior=maytrap -DSTRICT=1 -S -o - -Wall -Werror | FileCheck %s --check-prefix=CHECK-ASM --check-prefix=COMMON +// RUN: %clang_cc1 -x c++ -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -emit-llvm -o - -Wall -Werror | FileCheck %s --check-prefix=UNCONSTRAINED --check-prefix=COMMON +// RUN: %clang_cc1 -x c++ -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -ffp-exception-behavior=maytrap -DSTRICT=1 -emit-llvm -o - -Wall -Werror | FileCheck %s --check-prefix=CONSTRAINED --check-prefix=COMMON +// RUN: %clang_cc1 -x c++ -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -S -o - -Wall -Werror | FileCheck %s --check-prefix=CHECK-ASM --check-prefix=COMMON +// RUN: %clang_cc1 -x c++ -ffreestanding %s -triple=x86_64-unknown-linux-gnu -target-feature +avx512vl -target-feature +avx512fp16 -ffp-exception-behavior=maytrap -DSTRICT=1 -S -o - -Wall -Werror | FileCheck %s --check-prefix=CHECK-ASM --check-prefix=COMMON + +#ifdef STRICT +// Test that the constrained intrinsics are picking up the exception +// metadata from the AST instead of the global default from the command line. + +#pragma float_control(except, on) +#endif + + +#include + +__m128h test_mm_sqrt_sh(__m128h x, __m128h y) { + // COMMON-LABEL: test_mm_sqrt_sh + // UNCONSTRAINED: call {{.*}}half @llvm.sqrt.f16(half {{.*}}) + // CONSTRAINED: call {{.*}}half @llvm.experimental.constrained.sqrt.f16(half {{.*}}, metadata !{{.*}}) + // CHECK-ASM: vsqrtsh %xmm{{.*}}, + return _mm_sqrt_sh(x, y); +} + +__m128h test_mm_mask_sqrt_sh(__m128h __W, __mmask8 __U, __m128h __A, __m128h __B){ + // COMMON-LABEL: test_mm_mask_sqrt_sh + // COMMONIR: extractelement <8 x half> %{{.*}}, i64 0 + // UNCONSTRAINED: call {{.*}}half @llvm.sqrt.f16(half %{{.*}}) + // CONSTRAINED: call {{.*}}half @llvm.experimental.constrained.sqrt.f16(half %{{.*}}, metadata !{{.*}}) + // CHECK-ASM: vsqrtsh %xmm{{.*}}, + // COMMONIR-NEXT: extractelement <8 x half> %{{.*}}, i64 0 + // COMMONIR-NEXT: bitcast i8 %{{.*}} to <8 x i1> + // COMMONIR-NEXT: extractelement <8 x i1> %{{.*}}, i64 0 + // COMMONIR-NEXT: select i1 {{.*}}, half {{.*}}, half {{.*}} + // COMMONIR-NEXT: insertelement <8 x half> %{{.*}}, half {{.*}}, i64 0 + return _mm_mask_sqrt_sh(__W,__U,__A,__B); +} + +__m128h test_mm_maskz_sqrt_sh(__mmask8 __U, __m128h __A, __m128h __B){ + // COMMON-LABEL: test_mm_maskz_sqrt_sh + // COMMONIR: extractelement <2 x half> %{{.*}}, i64 0 + // UNCONSTRAINED: call {{.*}}half @llvm.sqrt.f16(half %{{.*}}) + // CONSTRAINED: call {{.*}}half @llvm.experimental.constrained.sqrt.f16(half %{{.*}}, metadata !{{.*}}) + // CHECK-ASM: vsqrtsh %xmm{{.*}}, + // COMMONIR-NEXT: extractelement <2 x half> %{{.*}}, i64 0 + // COMMONIR-NEXT: bitcast i8 %{{.*}} to <8 x i1> + // COMMONIR-NEXT: extractelement <8 x i1> %{{.*}}, i64 0 + // COMMONIR-NEXT: select i1 {{.*}}, half {{.*}}, half {{.*}} + // COMMONIR-NEXT: insertelement <2 x half> %{{.*}}, half {{.*}}, i64 0 + return _mm_maskz_sqrt_sh(__U,__A,__B); +} + +__m512h test_mm512_sqrt_ph(__m512h x) { + // COMMON-LABEL: test_mm512_sqrt_ph + // UNCONSTRAINED: call {{.*}}<32 x half> @llvm.sqrt.v32f16(<32 x half> {{.*}}) + // CONSTRAINED: call {{.*}}<32 x half> @llvm.experimental.constrained.sqrt.v32f16(<32 x half> {{.*}}, metadata !{{.*}}) + // CHECK-ASM: vsqrtph %zmm{{.*}}, + return _mm512_sqrt_ph(x); +} + +__m512h test_mm512_mask_sqrt_ph (__m512h __W, __mmask32 __U, __m512h __A) +{ + // COMMON-LABEL: test_mm512_mask_sqrt_ph + // UNCONSTRAINED: call <32 x half> @llvm.sqrt.v32f16(<32 x half> %{{.*}}) + // CONSTRAINED: call <32 x half> @llvm.experimental.constrained.sqrt.v32f16(<32 x half> %{{.*}}, metadata !{{.*}}) + // CHECK-ASM: vsqrtph %zmm{{.*}}, + // COMMONIR: bitcast i32 %{{.*}} to <32 x i1> + // COMMONIR: select <32 x i1> %{{.*}}, <32 x half> %{{.*}}, <32 x half> %{{.*}} + return _mm512_mask_sqrt_ph (__W,__U,__A); +} + +__m512h test_mm512_maskz_sqrt_ph (__mmask32 __U, __m512h __A) +{ + // COMMON-LABEL: test_mm512_maskz_sqrt_ph + // UNCONSTRAINED: call <32 x half> @llvm.sqrt.v32f16(<32 x half> %{{.*}}) + // CONSTRAINED: call <32 x half> @llvm.experimental.constrained.sqrt.v32f16(<32 x half> %{{.*}}, metadata !{{.*}}) + // CHECK-ASM: vsqrtph %zmm{{.*}}, + // COMMONIR: bitcast i32 %{{.*}} to <32 x i1> + // COMMONIR: select <32 x i1> %{{.*}}, <32 x half> %{{.*}}, <32 x half> {{.*}} + return _mm512_maskz_sqrt_ph (__U,__A); +}