| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,50 @@ | ||
| // RUN: %clang_cc1 -ffreestanding %s -Wno-implicit-function-declaration -triple=i386-- -target-feature +movrs -target-feature +avx10.2-512 -emit-llvm -verify | ||
|
|
||
| #include <immintrin.h> | ||
| __m512i test_mm512_loadrs_epi8(const __m512i * __A) { | ||
| return _mm512_loadrs_epi8(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_mask_loadrs_epi8(__m512i __A, __mmask64 __B, const __m512i * __C) { | ||
| return _mm512_mask_loadrs_epi8(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_maskz_loadrs_epi8(__mmask64 __A, const __m512i * __B) { | ||
| return _mm512_maskz_loadrs_epi8(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_loadrs_epi32(const __m512i * __A) { | ||
| return _mm512_loadrs_epi32(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_mask_loadrs_epi32(__m512i __A, __mmask16 __B, const __m512i * __C) { | ||
| return _mm512_mask_loadrs_epi32(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_maskz_loadrs_epi32(__mmask16 __A, const __m512i * __B) { | ||
| return _mm512_maskz_loadrs_epi32(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_loadrs_epi64(const __m512i * __A) { | ||
| return _mm512_loadrs_epi64(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_mask_loadrs_epi64(__m512i __A, __mmask8 __B, const __m512i * __C) { | ||
| return _mm512_mask_loadrs_epi64(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_maskz_loadrs_epi64(__mmask8 __A, const __m512i * __B) { | ||
| return _mm512_maskz_loadrs_epi64(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_loadrs_epi16(const __m512i * __A) { | ||
| return _mm512_loadrs_epi16(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_mask_loadrs_epi16(__m512i __A, __mmask32 __B, const __m512i * __C) { | ||
| return _mm512_mask_loadrs_epi16(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } | ||
|
|
||
| __m512i test_mm512_maskz_loadrs_epi16(__mmask32 __A, const __m512i * __B) { | ||
| return _mm512_maskz_loadrs_epi16(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m512i' (vector of 8 'long long' values)}} | ||
| } |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,87 @@ | ||
| // RUN: %clang_cc1 -ffreestanding %s -triple=x86_64-- -target-feature +movrs -target-feature +avx10.2-512 -emit-llvm -o - -Wall -Werror | FileCheck %s | ||
|
|
||
| #include <immintrin.h> | ||
|
|
||
| __m512i test_mm512_loadrs_epi8(const __m512i * __A) { | ||
| // CHECK-LABEL: @test_mm512_loadrs_epi8( | ||
| // CHECK: call <64 x i8> @llvm.x86.avx10.vmovrsb512( | ||
| return _mm512_loadrs_epi8(__A); | ||
| } | ||
|
|
||
| __m512i test_mm512_mask_loadrs_epi8(__m512i __A, __mmask64 __B, const __m512i * __C) { | ||
| // CHECK-LABEL: @test_mm512_mask_loadrs_epi8( | ||
| // CHECK: call <64 x i8> @llvm.x86.avx10.vmovrsb512( | ||
| // CHECK: select <64 x i1> %{{.*}}, <64 x i8> %{{.*}}, <64 x i8> %{{.*}} | ||
| return _mm512_mask_loadrs_epi8(__A, __B, __C); | ||
| } | ||
|
|
||
| __m512i test_mm512_maskz_loadrs_epi8(__mmask64 __A, const __m512i * __B) { | ||
| // CHECK-LABEL: @test_mm512_maskz_loadrs_epi8( | ||
| // CHECK: call <64 x i8> @llvm.x86.avx10.vmovrsb512( | ||
| // CHECK: store <8 x i64> zeroinitializer | ||
| // CHECK: select <64 x i1> %{{.*}}, <64 x i8> %{{.*}}, <64 x i8> %{{.*}} | ||
| return _mm512_maskz_loadrs_epi8(__A, __B); | ||
| } | ||
|
|
||
| __m512i test_mm512_loadrs_epi32(const __m512i * __A) { | ||
| // CHECK-LABEL: @test_mm512_loadrs_epi32( | ||
| // CHECK: call <16 x i32> @llvm.x86.avx10.vmovrsd512( | ||
| return _mm512_loadrs_epi32(__A); | ||
| } | ||
|
|
||
| __m512i test_mm512_mask_loadrs_epi32(__m512i __A, __mmask16 __B, const __m512i * __C) { | ||
| // CHECK-LABEL: @test_mm512_mask_loadrs_epi32( | ||
| // CHECK: call <16 x i32> @llvm.x86.avx10.vmovrsd512( | ||
| // CHECK: select <16 x i1> %{{.*}}, <16 x i32> %{{.*}}, <16 x i32> %{{.*}} | ||
| return _mm512_mask_loadrs_epi32(__A, __B, __C); | ||
| } | ||
|
|
||
| __m512i test_mm512_maskz_loadrs_epi32(__mmask16 __A, const __m512i * __B) { | ||
| // CHECK-LABEL: @test_mm512_maskz_loadrs_epi32( | ||
| // CHECK: call <16 x i32> @llvm.x86.avx10.vmovrsd512( | ||
| // CHECK: store <8 x i64> zeroinitializer | ||
| // CHECK: select <16 x i1> %{{.*}}, <16 x i32> %{{.*}}, <16 x i32> %{{.*}} | ||
| return _mm512_maskz_loadrs_epi32(__A, __B); | ||
| } | ||
|
|
||
| __m512i test_mm512_loadrs_epi64(const __m512i * __A) { | ||
| // CHECK-LABEL: @test_mm512_loadrs_epi64( | ||
| // CHECK: call <8 x i64> @llvm.x86.avx10.vmovrsq512( | ||
| return _mm512_loadrs_epi64(__A); | ||
| } | ||
|
|
||
| __m512i test_mm512_mask_loadrs_epi64(__m512i __A, __mmask8 __B, const __m512i * __C) { | ||
| // CHECK-LABEL: @test_mm512_mask_loadrs_epi64( | ||
| // CHECK: call <8 x i64> @llvm.x86.avx10.vmovrsq512( | ||
| // CHECK: select <8 x i1> %{{.*}}, <8 x i64> %{{.*}}, <8 x i64> %{{.*}} | ||
| return _mm512_mask_loadrs_epi64(__A, __B, __C); | ||
| } | ||
|
|
||
| __m512i test_mm512_maskz_loadrs_epi64(__mmask8 __A, const __m512i * __B) { | ||
| // CHECK-LABEL: @test_mm512_maskz_loadrs_epi64( | ||
| // CHECK: call <8 x i64> @llvm.x86.avx10.vmovrsq512( | ||
| // CHECK: store <8 x i64> zeroinitializer | ||
| // CHECK: select <8 x i1> %{{.*}}, <8 x i64> %{{.*}}, <8 x i64> %{{.*}} | ||
| return _mm512_maskz_loadrs_epi64(__A, __B); | ||
| } | ||
|
|
||
| __m512i test_mm512_loadrs_epi16(const __m512i * __A) { | ||
| // CHECK-LABEL: @test_mm512_loadrs_epi16( | ||
| // CHECK: call <32 x i16> @llvm.x86.avx10.vmovrsw512( | ||
| return _mm512_loadrs_epi16(__A); | ||
| } | ||
|
|
||
| __m512i test_mm512_mask_loadrs_epi16(__m512i __A, __mmask32 __B, const __m512i * __C) { | ||
| // CHECK-LABEL: @test_mm512_mask_loadrs_epi16( | ||
| // CHECK: call <32 x i16> @llvm.x86.avx10.vmovrsw512( | ||
| // CHECK: select <32 x i1> %{{.*}}, <32 x i16> %{{.*}}, <32 x i16> %{{.*}} | ||
| return _mm512_mask_loadrs_epi16(__A, __B, __C); | ||
| } | ||
|
|
||
| __m512i test_mm512_maskz_loadrs_epi16(__mmask32 __A, const __m512i * __B) { | ||
| // CHECK-LABEL: @test_mm512_maskz_loadrs_epi16( | ||
| // CHECK: call <32 x i16> @llvm.x86.avx10.vmovrsw512( | ||
| // CHECK: store <8 x i64> zeroinitializer | ||
| // CHECK: select <32 x i1> %{{.*}}, <32 x i16> %{{.*}}, <32 x i16> %{{.*}} | ||
| return _mm512_maskz_loadrs_epi16(__A, __B); | ||
| } |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,98 @@ | ||
| // RUN: %clang_cc1 -ffreestanding %s -Wno-implicit-function-declaration -triple=i386-unknown-unknown -target-feature +movrs -target-feature +avx10.2-256 -emit-llvm -verify | ||
|
|
||
| #include <immintrin.h> | ||
| __m128i test_mm_loadrs_epi8(const __m128i * __A) { | ||
| return _mm_loadrs_epi8(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_mask_loadrs_epi8(__m128i __A, __mmask16 __B, const __m128i * __C) { | ||
| return _mm_mask_loadrs_epi8(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_maskz_loadrs_epi8(__mmask16 __A, const __m128i * __B) { | ||
| return _mm_maskz_loadrs_epi8(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_loadrs_epi8(const __m256i * __A) { | ||
| return _mm256_loadrs_epi8(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_mask_loadrs_epi8(__m256i __A, __mmask32 __B, const __m256i * __C) { | ||
| return _mm256_mask_loadrs_epi8(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_maskz_loadrs_epi8(__mmask32 __A, const __m256i * __B) { | ||
| return _mm256_maskz_loadrs_epi8(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_loadrs_epi32(const __m128i * __A) { | ||
| return _mm_loadrs_epi32(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_mask_loadrs_epi32(__m128i __A, __mmask8 __B, const __m128i * __C) { | ||
| return _mm_mask_loadrs_epi32(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_maskz_loadrs_epi32(__mmask8 __A, const __m128i * __B) { | ||
| return _mm_maskz_loadrs_epi32(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_loadrs_epi32(const __m256i * __A) { | ||
| return _mm256_loadrs_epi32(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_mask_loadrs_epi32(__m256i __A, __mmask8 __B, const __m256i * __C) { | ||
| return _mm256_mask_loadrs_epi32(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_maskz_loadrs_epi32(__mmask8 __A, const __m256i * __B) { | ||
| return _mm256_maskz_loadrs_epi32(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_loadrs_epi64(const __m128i * __A) { | ||
| return _mm_loadrs_epi64(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_mask_loadrs_epi64(__m128i __A, __mmask8 __B, const __m128i * __C) { | ||
| return _mm_mask_loadrs_epi64(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_maskz_loadrs_epi64(__mmask8 __A, const __m128i * __B) { | ||
| return _mm_maskz_loadrs_epi64(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_loadrs_epi64(const __m256i * __A) { | ||
| return _mm256_loadrs_epi64(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_mask_loadrs_epi64(__m256i __A, __mmask8 __B, const __m256i * __C) { | ||
| return _mm256_mask_loadrs_epi64(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_maskz_loadrs_epi64(__mmask8 __A, const __m256i * __B) { | ||
| return _mm256_maskz_loadrs_epi64(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_loadrs_epi16(const __m128i * __A) { | ||
| return _mm_loadrs_epi16(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_mask_loadrs_epi16(__m128i __A, __mmask8 __B, const __m128i * __C) { | ||
| return _mm_mask_loadrs_epi16(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m128i test_mm_maskz_loadrs_epi16(__mmask8 __A, const __m128i * __B) { | ||
| return _mm_maskz_loadrs_epi16(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m128i' (vector of 2 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_loadrs_epi16(const __m256i * __A) { | ||
| return _mm256_loadrs_epi16(__A); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_mask_loadrs_epi16(__m256i __A, __mmask16 __B, const __m256i * __C) { | ||
| return _mm256_mask_loadrs_epi16(__A, __B, __C); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } | ||
|
|
||
| __m256i test_mm256_maskz_loadrs_epi16(__mmask16 __A, const __m256i * __B) { | ||
| return _mm256_maskz_loadrs_epi16(__A, __B); // expected-error {{returning 'int' from a function with incompatible result type '__m256i' (vector of 4 'long long' values)}} | ||
| } |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,171 @@ | ||
| // RUN: %clang_cc1 -ffreestanding %s -triple=x86_64-- -target-feature +movrs -target-feature +avx10.2-256 -emit-llvm -o - -Wall -Werror | FileCheck %s | ||
|
|
||
| #include <immintrin.h> | ||
|
|
||
| __m128i test_mm_loadrs_epi8(const __m128i * __A) { | ||
| // CHECK-LABEL: @test_mm_loadrs_epi8( | ||
| // CHECK: call <16 x i8> @llvm.x86.avx10.vmovrsb128( | ||
| return _mm_loadrs_epi8(__A); | ||
| } | ||
|
|
||
| __m128i test_mm_mask_loadrs_epi8(__m128i __A, __mmask16 __B, const __m128i * __C) { | ||
| // CHECK-LABEL: @test_mm_mask_loadrs_epi8( | ||
| // CHECK: call <16 x i8> @llvm.x86.avx10.vmovrsb128( | ||
| // CHECK: select <16 x i1> %{{.*}}, <16 x i8> %{{.*}}, <16 x i8> %{{.*}} | ||
| return _mm_mask_loadrs_epi8(__A, __B, __C); | ||
| } | ||
|
|
||
| __m128i test_mm_maskz_loadrs_epi8(__mmask16 __A, const __m128i * __B) { | ||
| // CHECK-LABEL: @test_mm_maskz_loadrs_epi8( | ||
| // CHECK: call <16 x i8> @llvm.x86.avx10.vmovrsb128( | ||
| // CHECK: store <2 x i64> zeroinitializer | ||
| // CHECK: select <16 x i1> %{{.*}}, <16 x i8> %{{.*}}, <16 x i8> %{{.*}} | ||
| return _mm_maskz_loadrs_epi8(__A, __B); | ||
| } | ||
|
|
||
| __m256i test_mm256_loadrs_epi8(const __m256i * __A) { | ||
| // CHECK-LABEL: @test_mm256_loadrs_epi8( | ||
| // CHECK: call <32 x i8> @llvm.x86.avx10.vmovrsb256( | ||
| return _mm256_loadrs_epi8(__A); | ||
| } | ||
|
|
||
| __m256i test_mm256_mask_loadrs_epi8(__m256i __A, __mmask32 __B, const __m256i * __C) { | ||
| // CHECK-LABEL: @test_mm256_mask_loadrs_epi8( | ||
| // CHECK: call <32 x i8> @llvm.x86.avx10.vmovrsb256( | ||
| // CHECK: select <32 x i1> %{{.*}}, <32 x i8> %{{.*}}, <32 x i8> %{{.*}} | ||
| return _mm256_mask_loadrs_epi8(__A, __B, __C); | ||
| } | ||
|
|
||
| __m256i test_mm256_maskz_loadrs_epi8(__mmask32 __A, const __m256i * __B) { | ||
| // CHECK-LABEL: @test_mm256_maskz_loadrs_epi8( | ||
| // CHECK: call <32 x i8> @llvm.x86.avx10.vmovrsb256( | ||
| // CHECK: store <4 x i64> zeroinitializer | ||
| // CHECK: select <32 x i1> %{{.*}}, <32 x i8> %{{.*}}, <32 x i8> %{{.*}} | ||
| return _mm256_maskz_loadrs_epi8(__A, __B); | ||
| } | ||
|
|
||
| __m128i test_mm_loadrs_epi32(const __m128i * __A) { | ||
| // CHECK-LABEL: @test_mm_loadrs_epi32( | ||
| // CHECK: call <4 x i32> @llvm.x86.avx10.vmovrsd128( | ||
| return _mm_loadrs_epi32(__A); | ||
| } | ||
|
|
||
| __m128i test_mm_mask_loadrs_epi32(__m128i __A, __mmask8 __B, const __m128i * __C) { | ||
| // CHECK-LABEL: @test_mm_mask_loadrs_epi32( | ||
| // CHECK: call <4 x i32> @llvm.x86.avx10.vmovrsd128( | ||
| // CHECK: select <4 x i1> %{{.*}}, <4 x i32> %{{.*}}, <4 x i32> %{{.*}} | ||
| return _mm_mask_loadrs_epi32(__A, __B, __C); | ||
| } | ||
|
|
||
| __m128i test_mm_maskz_loadrs_epi32(__mmask8 __A, const __m128i * __B) { | ||
| // CHECK-LABEL: @test_mm_maskz_loadrs_epi32( | ||
| // CHECK: call <4 x i32> @llvm.x86.avx10.vmovrsd128( | ||
| // CHECK: store <2 x i64> zeroinitializer | ||
| // CHECK: select <4 x i1> %{{.*}}, <4 x i32> %{{.*}}, <4 x i32> %{{.*}} | ||
| return _mm_maskz_loadrs_epi32(__A, __B); | ||
| } | ||
|
|
||
| __m256i test_mm256_loadrs_epi32(const __m256i * __A) { | ||
| // CHECK-LABEL: @test_mm256_loadrs_epi32( | ||
| // CHECK: call <8 x i32> @llvm.x86.avx10.vmovrsd256( | ||
| return _mm256_loadrs_epi32(__A); | ||
| } | ||
|
|
||
| __m256i test_mm256_mask_loadrs_epi32(__m256i __A, __mmask8 __B, const __m256i * __C) { | ||
| // CHECK-LABEL: @test_mm256_mask_loadrs_epi32( | ||
| // CHECK: call <8 x i32> @llvm.x86.avx10.vmovrsd256( | ||
| // CHECK: select <8 x i1> %{{.*}}, <8 x i32> %{{.*}}, <8 x i32> %{{.*}} | ||
| return _mm256_mask_loadrs_epi32(__A, __B, __C); | ||
| } | ||
|
|
||
| __m256i test_mm256_maskz_loadrs_epi32(__mmask8 __A, const __m256i * __B) { | ||
| // CHECK-LABEL: @test_mm256_maskz_loadrs_epi32( | ||
| // CHECK: call <8 x i32> @llvm.x86.avx10.vmovrsd256( | ||
| // CHECK: store <4 x i64> zeroinitializer | ||
| // CHECK: select <8 x i1> %{{.*}}, <8 x i32> %{{.*}}, <8 x i32> %{{.*}} | ||
| return _mm256_maskz_loadrs_epi32(__A, __B); | ||
| } | ||
|
|
||
| __m128i test_mm_loadrs_epi64(const __m128i * __A) { | ||
| // CHECK-LABEL: @test_mm_loadrs_epi64( | ||
| // CHECK: call <2 x i64> @llvm.x86.avx10.vmovrsq128( | ||
| return _mm_loadrs_epi64(__A); | ||
| } | ||
|
|
||
| __m128i test_mm_mask_loadrs_epi64(__m128i __A, __mmask8 __B, const __m128i * __C) { | ||
| // CHECK-LABEL: @test_mm_mask_loadrs_epi64( | ||
| // CHECK: call <2 x i64> @llvm.x86.avx10.vmovrsq128( | ||
| // CHECK: select <2 x i1> %{{.*}}, <2 x i64> %{{.*}}, <2 x i64> %{{.*}} | ||
| return _mm_mask_loadrs_epi64(__A, __B, __C); | ||
| } | ||
|
|
||
| __m128i test_mm_maskz_loadrs_epi64(__mmask8 __A, const __m128i * __B) { | ||
| // CHECK-LABEL: @test_mm_maskz_loadrs_epi64( | ||
| // CHECK: call <2 x i64> @llvm.x86.avx10.vmovrsq128( | ||
| // CHECK: store <2 x i64> zeroinitializer | ||
| // CHECK: select <2 x i1> %{{.*}}, <2 x i64> %{{.*}}, <2 x i64> %{{.*}} | ||
| return _mm_maskz_loadrs_epi64(__A, __B); | ||
| } | ||
|
|
||
| __m256i test_mm256_loadrs_epi64(const __m256i * __A) { | ||
| // CHECK-LABEL: @test_mm256_loadrs_epi64( | ||
| // CHECK: call <4 x i64> @llvm.x86.avx10.vmovrsq256( | ||
| return _mm256_loadrs_epi64(__A); | ||
| } | ||
|
|
||
| __m256i test_mm256_mask_loadrs_epi64(__m256i __A, __mmask8 __B, const __m256i * __C) { | ||
| // CHECK-LABEL: @test_mm256_mask_loadrs_epi64( | ||
| // CHECK: call <4 x i64> @llvm.x86.avx10.vmovrsq256( | ||
| // CHECK: select <4 x i1> %{{.*}}, <4 x i64> %{{.*}}, <4 x i64> %{{.*}} | ||
| return _mm256_mask_loadrs_epi64(__A, __B, __C); | ||
| } | ||
|
|
||
| __m256i test_mm256_maskz_loadrs_epi64(__mmask8 __A, const __m256i * __B) { | ||
| // CHECK-LABEL: @test_mm256_maskz_loadrs_epi64( | ||
| // CHECK: call <4 x i64> @llvm.x86.avx10.vmovrsq256( | ||
| // CHECK: store <4 x i64> zeroinitializer | ||
| // CHECK: select <4 x i1> %{{.*}}, <4 x i64> %{{.*}}, <4 x i64> %{{.*}} | ||
| return _mm256_maskz_loadrs_epi64(__A, __B); | ||
| } | ||
|
|
||
| __m128i test_mm_loadrs_epi16(const __m128i * __A) { | ||
| // CHECK-LABEL: @test_mm_loadrs_epi16( | ||
| // CHECK: call <8 x i16> @llvm.x86.avx10.vmovrsw128( | ||
| return _mm_loadrs_epi16(__A); | ||
| } | ||
|
|
||
| __m128i test_mm_mask_loadrs_epi16(__m128i __A, __mmask8 __B, const __m128i * __C) { | ||
| // CHECK-LABEL: @test_mm_mask_loadrs_epi16( | ||
| // CHECK: call <8 x i16> @llvm.x86.avx10.vmovrsw128( | ||
| // CHECK: select <8 x i1> %{{.*}}, <8 x i16> %{{.*}}, <8 x i16> %{{.*}} | ||
| return _mm_mask_loadrs_epi16(__A, __B, __C); | ||
| } | ||
|
|
||
| __m128i test_mm_maskz_loadrs_epi16(__mmask8 __A, const __m128i * __B) { | ||
| // CHECK-LABEL: @test_mm_maskz_loadrs_epi16( | ||
| // CHECK: call <8 x i16> @llvm.x86.avx10.vmovrsw128( | ||
| // CHECK: store <2 x i64> zeroinitializer | ||
| // CHECK: select <8 x i1> %{{.*}}, <8 x i16> %{{.*}}, <8 x i16> %{{.*}} | ||
| return _mm_maskz_loadrs_epi16(__A, __B); | ||
| } | ||
|
|
||
| __m256i test_mm256_loadrs_epi16(const __m256i * __A) { | ||
| // CHECK-LABEL: @test_mm256_loadrs_epi16( | ||
| // CHECK: call <16 x i16> @llvm.x86.avx10.vmovrsw256( | ||
| return _mm256_loadrs_epi16(__A); | ||
| } | ||
|
|
||
| __m256i test_mm256_mask_loadrs_epi16(__m256i __A, __mmask16 __B, const __m256i * __C) { | ||
| // CHECK-LABEL: @test_mm256_mask_loadrs_epi16( | ||
| // CHECK: call <16 x i16> @llvm.x86.avx10.vmovrsw256( | ||
| // CHECK: select <16 x i1> %{{.*}}, <16 x i16> %{{.*}}, <16 x i16> %{{.*}} | ||
| return _mm256_mask_loadrs_epi16(__A, __B, __C); | ||
| } | ||
|
|
||
| __m256i test_mm256_maskz_loadrs_epi16(__mmask16 __A, const __m256i * __B) { | ||
| // CHECK-LABEL: @test_mm256_maskz_loadrs_epi16( | ||
| // CHECK: call <16 x i16> @llvm.x86.avx10.vmovrsw256( | ||
| // CHECK: store <4 x i64> zeroinitializer | ||
| // CHECK: select <16 x i1> %{{.*}}, <16 x i16> %{{.*}}, <16 x i16> %{{.*}} | ||
| return _mm256_maskz_loadrs_epi16(__A, __B); | ||
| } |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -52,7 +52,6 @@ | |
| ; NM1: T f | ||
| ; NM2: T g | ||
|
|
||
| target triple = "wasm32-unknown-unknown" | ||
|
|
||
| declare void @g(...) | ||
|
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,163 @@ | ||
| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py | ||
| ; RUN: llc < %s -mtriple=x86_64-- -mattr=+movrs,+avx10.2-512 -verify-machineinstrs --show-mc-encoding | FileCheck %s --check-prefixes=CHECK | ||
|
|
||
| declare <64 x i8> @llvm.x86.avx10.vmovrsb512(ptr) | ||
| declare <16 x i32> @llvm.x86.avx10.vmovrsd512(ptr) | ||
| declare <8 x i64> @llvm.x86.avx10.vmovrsq512(ptr) | ||
| declare <32 x i16> @llvm.x86.avx10.vmovrsw512(ptr) | ||
|
|
||
| define <8 x i64> @test_mm512_movrsb_epi8(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm512_movrsb_epi8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsb (%rdi), %zmm0 # encoding: [0x62,0xf5,0x7f,0x48,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <64 x i8> @llvm.x86.avx10.vmovrsb512(ptr %__A) | ||
| %1 = bitcast <64 x i8> %0 to <8 x i64> | ||
| ret <8 x i64> %1 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_mask_movrsb_epi8(<8 x i64> %__A, i64 %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm512_mask_movrsb_epi8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovq %rdi, %k1 # encoding: [0xc4,0xe1,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsb (%rsi), %zmm0 {%k1} # encoding: [0x62,0xf5,0x7f,0x49,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <64 x i8> @llvm.x86.avx10.vmovrsb512(ptr %__C) | ||
| %1 = bitcast <8 x i64> %__A to <64 x i8> | ||
| %2 = bitcast i64 %__B to <64 x i1> | ||
| %3 = select <64 x i1> %2, <64 x i8> %0, <64 x i8> %1 | ||
| %4 = bitcast <64 x i8> %3 to <8 x i64> | ||
| ret <8 x i64> %4 | ||
| } | ||
|
|
||
| define dso_local <8 x i64> @test_mm512_maskz_movrsb_epi8(i64 %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm512_maskz_movrsb_epi8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovq %rdi, %k1 # encoding: [0xc4,0xe1,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsb (%rsi), %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7f,0xc9,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <64 x i8> @llvm.x86.avx10.vmovrsb512(ptr %__B) | ||
| %1 = bitcast i64 %__A to <64 x i1> | ||
| %2 = select <64 x i1> %1, <64 x i8> %0, <64 x i8> zeroinitializer | ||
| %3 = bitcast <64 x i8> %2 to <8 x i64> | ||
| ret <8 x i64> %3 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_movrsd_epi32(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm512_movrsd_epi32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsd (%rdi), %zmm0 # encoding: [0x62,0xf5,0x7e,0x48,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i32> @llvm.x86.avx10.vmovrsd512(ptr %__A) | ||
| %1 = bitcast <16 x i32> %0 to <8 x i64> | ||
| ret <8 x i64> %1 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_mask_movrsd_epi32(<8 x i64> %__A, i16 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm512_mask_movrsd_epi32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsd (%rsi), %zmm0 {%k1} # encoding: [0x62,0xf5,0x7e,0x49,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i32> @llvm.x86.avx10.vmovrsd512(ptr %__C) | ||
| %1 = bitcast <8 x i64> %__A to <16 x i32> | ||
| %2 = bitcast i16 %__B to <16 x i1> | ||
| %3 = select <16 x i1> %2, <16 x i32> %0, <16 x i32> %1 | ||
| %4 = bitcast <16 x i32> %3 to <8 x i64> | ||
| ret <8 x i64> %4 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_maskz_movrsd_epi32(i16 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm512_maskz_movrsd_epi32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsd (%rsi), %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7e,0xc9,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i32> @llvm.x86.avx10.vmovrsd512(ptr %__B) | ||
| %1 = bitcast i16 %__A to <16 x i1> | ||
| %2 = select <16 x i1> %1, <16 x i32> %0, <16 x i32> zeroinitializer | ||
| %3 = bitcast <16 x i32> %2 to <8 x i64> | ||
| ret <8 x i64> %3 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_movrsq_epi64(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm512_movrsq_epi64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsq (%rdi), %zmm0 # encoding: [0x62,0xf5,0xfe,0x48,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i64> @llvm.x86.avx10.vmovrsq512(ptr %__A) | ||
| ret <8 x i64> %0 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_mask_movrsq_epi64(<8 x i64> %__A, i8 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm512_mask_movrsq_epi64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsq (%rsi), %zmm0 {%k1} # encoding: [0x62,0xf5,0xfe,0x49,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i64> @llvm.x86.avx10.vmovrsq512(ptr %__C) | ||
| %1 = bitcast i8 %__B to <8 x i1> | ||
| %2 = select <8 x i1> %1, <8 x i64> %0, <8 x i64> %__A | ||
| ret <8 x i64> %2 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_maskz_movrsq_epi64(i8 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm512_maskz_movrsq_epi64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsq (%rsi), %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0xfe,0xc9,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i64> @llvm.x86.avx10.vmovrsq512(ptr %__B) | ||
| %1 = bitcast i8 %__A to <8 x i1> | ||
| %2 = select <8 x i1> %1, <8 x i64> %0, <8 x i64> zeroinitializer | ||
| ret <8 x i64> %2 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_movrsw_epi16(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm512_movrsw_epi16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsw (%rdi), %zmm0 # encoding: [0x62,0xf5,0xff,0x48,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <32 x i16> @llvm.x86.avx10.vmovrsw512(ptr %__A) | ||
| %1 = bitcast <32 x i16> %0 to <8 x i64> | ||
| ret <8 x i64> %1 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_mask_movrsw_epi16(<8 x i64> %__A, i32 %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm512_mask_movrsw_epi16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsw (%rsi), %zmm0 {%k1} # encoding: [0x62,0xf5,0xff,0x49,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <32 x i16> @llvm.x86.avx10.vmovrsw512(ptr %__C) | ||
| %1 = bitcast <8 x i64> %__A to <32 x i16> | ||
| %2 = bitcast i32 %__B to <32 x i1> | ||
| %3 = select <32 x i1> %2, <32 x i16> %0, <32 x i16> %1 | ||
| %4 = bitcast <32 x i16> %3 to <8 x i64> | ||
| ret <8 x i64> %4 | ||
| } | ||
|
|
||
| define <8 x i64> @test_mm512_maskz_movrsw_epi16(i32 %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm512_maskz_movrsw_epi16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsw (%rsi), %zmm0 {%k1} {z} # encoding: [0x62,0xf5,0xff,0xc9,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <32 x i16> @llvm.x86.avx10.vmovrsw512(ptr %__B) | ||
| %1 = bitcast i32 %__A to <32 x i1> | ||
| %2 = select <32 x i1> %1, <32 x i16> %0, <32 x i16> zeroinitializer | ||
| %3 = bitcast <32 x i16> %2 to <8 x i64> | ||
| ret <8 x i64> %3 | ||
| } |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,329 @@ | ||
| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py | ||
| ; RUN: llc < %s -mtriple=x86_64-- -mattr=+movrs,+avx10.2-256 -verify-machineinstrs --show-mc-encoding | FileCheck %s --check-prefixes=CHECK | ||
|
|
||
| define <2 x i64> @test_mm_movrsb_epu8(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm_movrsb_epu8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsb (%rdi), %xmm0 # encoding: [0x62,0xf5,0x7f,0x08,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i8> @llvm.x86.avx10.vmovrsb128(ptr %__A) | ||
| %1 = bitcast <16 x i8> %0 to <2 x i64> | ||
| ret <2 x i64> %1 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_mask_movrsb_epu8(<2 x i64> %__A, i16 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm_mask_movrsb_epu8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsb (%rsi), %xmm0 {%k1} # encoding: [0x62,0xf5,0x7f,0x09,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i8> @llvm.x86.avx10.vmovrsb128(ptr %__C) | ||
| %1 = bitcast <2 x i64> %__A to <16 x i8> | ||
| %2 = bitcast i16 %__B to <16 x i1> | ||
| %3 = select <16 x i1> %2, <16 x i8> %0, <16 x i8> %1 | ||
| %4 = bitcast <16 x i8> %3 to <2 x i64> | ||
| ret <2 x i64> %4 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_maskz_movrsb_epu8(i16 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm_maskz_movrsb_epu8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsb (%rsi), %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7f,0x89,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i8> @llvm.x86.avx10.vmovrsb128(ptr %__B ) | ||
| %1 = bitcast i16 %__A to <16 x i1> | ||
| %2 = select <16 x i1> %1, <16 x i8> %0, <16 x i8> zeroinitializer | ||
| %3 = bitcast <16 x i8> %2 to <2 x i64> | ||
| ret <2 x i64> %3 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_movrsb_epu8(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm256_movrsb_epu8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsb (%rdi), %ymm0 # encoding: [0x62,0xf5,0x7f,0x28,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <32 x i8> @llvm.x86.avx10.vmovrsb256(ptr %__A) | ||
| %1 = bitcast <32 x i8> %0 to <4 x i64> | ||
| ret <4 x i64> %1 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_mask_movrsb_epu8(<4 x i64> %__A, i32 %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm256_mask_movrsb_epu8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsb (%rsi), %ymm0 {%k1} # encoding: [0x62,0xf5,0x7f,0x29,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <32 x i8> @llvm.x86.avx10.vmovrsb256(ptr %__C) | ||
| %1 = bitcast <4 x i64> %__A to <32 x i8> | ||
| %2 = bitcast i32 %__B to <32 x i1> | ||
| %3 = select <32 x i1> %2, <32 x i8> %0, <32 x i8> %1 | ||
| %4 = bitcast <32 x i8> %3 to <4 x i64> | ||
| ret <4 x i64> %4 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_maskz_movrsb_epu8(i32 %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm256_maskz_movrsb_epu8: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsb (%rsi), %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7f,0xa9,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <32 x i8> @llvm.x86.avx10.vmovrsb256(ptr %__B) | ||
| %1 = bitcast i32 %__A to <32 x i1> | ||
| %2 = select <32 x i1> %1, <32 x i8> %0, <32 x i8> zeroinitializer | ||
| %3 = bitcast <32 x i8> %2 to <4 x i64> | ||
| ret <4 x i64> %3 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_movrsd_epu32(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm_movrsd_epu32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsd (%rdi), %xmm0 # encoding: [0x62,0xf5,0x7e,0x08,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <4 x i32> @llvm.x86.avx10.vmovrsd128(ptr %__A) | ||
| %1 = bitcast <4 x i32> %0 to <2 x i64> | ||
| ret <2 x i64> %1 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_mask_movrsd_epu32(<2 x i64> %__A, i8 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm_mask_movrsd_epu32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsd (%rsi), %xmm0 {%k1} # encoding: [0x62,0xf5,0x7e,0x09,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <4 x i32> @llvm.x86.avx10.vmovrsd128(ptr %__C) | ||
| %1 = bitcast <2 x i64> %__A to <4 x i32> | ||
| %2 = bitcast i8 %__B to <8 x i1> | ||
| %extract.i = shufflevector <8 x i1> %2, <8 x i1> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 3> | ||
| %3 = select <4 x i1> %extract.i, <4 x i32> %0, <4 x i32> %1 | ||
| %4 = bitcast <4 x i32> %3 to <2 x i64> | ||
| ret <2 x i64> %4 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_maskz_movrsd_epu32(i8 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm_maskz_movrsd_epu32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsd (%rsi), %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0x7e,0x89,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <4 x i32> @llvm.x86.avx10.vmovrsd128(ptr %__B) | ||
| %1 = bitcast i8 %__A to <8 x i1> | ||
| %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 3> | ||
| %2 = select <4 x i1> %extract.i, <4 x i32> %0, <4 x i32> zeroinitializer | ||
| %3 = bitcast <4 x i32> %2 to <2 x i64> | ||
| ret <2 x i64> %3 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_movrsd_epu32(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm256_movrsd_epu32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsd (%rdi), %ymm0 # encoding: [0x62,0xf5,0x7e,0x28,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i32> @llvm.x86.avx10.vmovrsd256(ptr %__A) | ||
| %1 = bitcast <8 x i32> %0 to <4 x i64> | ||
| ret <4 x i64> %1 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_mask_movrsd_epu32(<4 x i64> %__A, i8 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm256_mask_movrsd_epu32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsd (%rsi), %ymm0 {%k1} # encoding: [0x62,0xf5,0x7e,0x29,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i32> @llvm.x86.avx10.vmovrsd256(ptr %__C) | ||
| %1 = bitcast <4 x i64> %__A to <8 x i32> | ||
| %2 = bitcast i8 %__B to <8 x i1> | ||
| %3 = select <8 x i1> %2, <8 x i32> %0, <8 x i32> %1 | ||
| %4 = bitcast <8 x i32> %3 to <4 x i64> | ||
| ret <4 x i64> %4 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_maskz_movrsd_epu32(i8 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm256_maskz_movrsd_epu32: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsd (%rsi), %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0x7e,0xa9,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i32> @llvm.x86.avx10.vmovrsd256(ptr %__B) | ||
| %1 = bitcast i8 %__A to <8 x i1> | ||
| %2 = select <8 x i1> %1, <8 x i32> %0, <8 x i32> zeroinitializer | ||
| %3 = bitcast <8 x i32> %2 to <4 x i64> | ||
| ret <4 x i64> %3 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_movrsq_epu64(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm_movrsq_epu64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsq (%rdi), %xmm0 # encoding: [0x62,0xf5,0xfe,0x08,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <2 x i64> @llvm.x86.avx10.vmovrsq128(ptr %__A) | ||
| ret <2 x i64> %0 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_mask_movrsq_epu64(<2 x i64> %__A, i8 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm_mask_movrsq_epu64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsq (%rsi), %xmm0 {%k1} # encoding: [0x62,0xf5,0xfe,0x09,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <2 x i64> @llvm.x86.avx10.vmovrsq128(ptr %__C) | ||
| %1 = bitcast i8 %__B to <8 x i1> | ||
| %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <2 x i32> <i32 0, i32 1> | ||
| %2 = select <2 x i1> %extract.i, <2 x i64> %0, <2 x i64> %__A | ||
| ret <2 x i64> %2 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_maskz_movrsq_epu64(i8 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm_maskz_movrsq_epu64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsq (%rsi), %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0xfe,0x89,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <2 x i64> @llvm.x86.avx10.vmovrsq128(ptr %__B) | ||
| %1 = bitcast i8 %__A to <8 x i1> | ||
| %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <2 x i32> <i32 0, i32 1> | ||
| %2 = select <2 x i1> %extract.i, <2 x i64> %0, <2 x i64> zeroinitializer | ||
| ret <2 x i64> %2 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_movrsq_epu64(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm256_movrsq_epu64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsq (%rdi), %ymm0 # encoding: [0x62,0xf5,0xfe,0x28,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <4 x i64> @llvm.x86.avx10.vmovrsq256(ptr %__A) | ||
| ret <4 x i64> %0 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_mask_movrsq_epu64(<4 x i64> %__A, i8 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm256_mask_movrsq_epu64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsq (%rsi), %ymm0 {%k1} # encoding: [0x62,0xf5,0xfe,0x29,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <4 x i64> @llvm.x86.avx10.vmovrsq256(ptr %__C) | ||
| %1 = bitcast i8 %__B to <8 x i1> | ||
| %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 3> | ||
| %2 = select <4 x i1> %extract.i, <4 x i64> %0, <4 x i64> %__A | ||
| ret <4 x i64> %2 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_maskz_movrsq_epu64(i8 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm256_maskz_movrsq_epu64: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsq (%rsi), %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0xfe,0xa9,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <4 x i64> @llvm.x86.avx10.vmovrsq256(ptr %__B) | ||
| %1 = bitcast i8 %__A to <8 x i1> | ||
| %extract.i = shufflevector <8 x i1> %1, <8 x i1> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 3> | ||
| %2 = select <4 x i1> %extract.i, <4 x i64> %0, <4 x i64> zeroinitializer | ||
| ret <4 x i64> %2 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_movrsw_epu16(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm_movrsw_epu16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsw (%rdi), %xmm0 # encoding: [0x62,0xf5,0xff,0x08,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i16> @llvm.x86.avx10.vmovrsw128(ptr %__A) | ||
| %1 = bitcast <8 x i16> %0 to <2 x i64> | ||
| ret <2 x i64> %1 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_mask_movrsw_epu16(<2 x i64> %__A, i8 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm_mask_movrsw_epu16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsw (%rsi), %xmm0 {%k1} # encoding: [0x62,0xf5,0xff,0x09,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i16> @llvm.x86.avx10.vmovrsw128(ptr %__C) | ||
| %1 = bitcast <2 x i64> %__A to <8 x i16> | ||
| %2 = bitcast i8 %__B to <8 x i1> | ||
| %3 = select <8 x i1> %2, <8 x i16> %0, <8 x i16> %1 | ||
| %4 = bitcast <8 x i16> %3 to <2 x i64> | ||
| ret <2 x i64> %4 | ||
| } | ||
|
|
||
| define <2 x i64> @test_mm_maskz_movrsw_epu16(i8 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm_maskz_movrsw_epu16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsw (%rsi), %xmm0 {%k1} {z} # encoding: [0x62,0xf5,0xff,0x89,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <8 x i16> @llvm.x86.avx10.vmovrsw128(ptr %__B) | ||
| %1 = bitcast i8 %__A to <8 x i1> | ||
| %2 = select <8 x i1> %1, <8 x i16> %0, <8 x i16> zeroinitializer | ||
| %3 = bitcast <8 x i16> %2 to <2 x i64> | ||
| ret <2 x i64> %3 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_movrsw_epu16(ptr %__A) { | ||
| ; CHECK-LABEL: test_mm256_movrsw_epu16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: vmovrsw (%rdi), %ymm0 # encoding: [0x62,0xf5,0xff,0x28,0x6f,0x07] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i16> @llvm.x86.avx10.vmovrsw256(ptr %__A) | ||
| %1 = bitcast <16 x i16> %0 to <4 x i64> | ||
| ret <4 x i64> %1 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_mask_movrsw_epu16(<4 x i64> %__A, i16 zeroext %__B, ptr %__C) { | ||
| ; CHECK-LABEL: test_mm256_mask_movrsw_epu16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsw (%rsi), %ymm0 {%k1} # encoding: [0x62,0xf5,0xff,0x29,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i16> @llvm.x86.avx10.vmovrsw256(ptr %__C) | ||
| %1 = bitcast <4 x i64> %__A to <16 x i16> | ||
| %2 = bitcast i16 %__B to <16 x i1> | ||
| %3 = select <16 x i1> %2, <16 x i16> %0, <16 x i16> %1 | ||
| %4 = bitcast <16 x i16> %3 to <4 x i64> | ||
| ret <4 x i64> %4 | ||
| } | ||
|
|
||
| define <4 x i64> @test_mm256_maskz_movrsw_epu16(i16 zeroext %__A, ptr %__B) { | ||
| ; CHECK-LABEL: test_mm256_maskz_movrsw_epu16: | ||
| ; CHECK: # %bb.0: # %entry | ||
| ; CHECK-NEXT: kmovd %edi, %k1 # encoding: [0xc5,0xfb,0x92,0xcf] | ||
| ; CHECK-NEXT: vmovrsw (%rsi), %ymm0 {%k1} {z} # encoding: [0x62,0xf5,0xff,0xa9,0x6f,0x06] | ||
| ; CHECK-NEXT: retq # encoding: [0xc3] | ||
| entry: | ||
| %0 = tail call <16 x i16> @llvm.x86.avx10.vmovrsw256(ptr %__B) | ||
| %1 = bitcast i16 %__A to <16 x i1> | ||
| %2 = select <16 x i1> %1, <16 x i16> %0, <16 x i16> zeroinitializer | ||
| %3 = bitcast <16 x i16> %2 to <4 x i64> | ||
| ret <4 x i64> %3 | ||
| } | ||
|
|
||
| declare <16 x i8> @llvm.x86.avx10.vmovrsb128(ptr) | ||
| declare <32 x i8> @llvm.x86.avx10.vmovrsb256(ptr) | ||
| declare <4 x i32> @llvm.x86.avx10.vmovrsd128(ptr) | ||
| declare <8 x i32> @llvm.x86.avx10.vmovrsd256(ptr) | ||
| declare <2 x i64> @llvm.x86.avx10.vmovrsq128(ptr) | ||
| declare <4 x i64> @llvm.x86.avx10.vmovrsq256(ptr) | ||
| declare <8 x i16> @llvm.x86.avx10.vmovrsw128(ptr) | ||
| declare <16 x i16> @llvm.x86.avx10.vmovrsw256(ptr) |