Skip to content

Commit

Permalink
[SLP][NFC] Add a test for PR72202 to show a bug in mask generation for vectorized extractelements operands.
Browse files Browse the repository at this point in the history
  • Loading branch information
alexey-bataev committed Nov 16, 2023
1 parent ac4868e commit 181b2c1
Showing 1 changed file with 53 additions and 0 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,53 @@
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s

; Test for PR72202: shows a bug in mask generation for vectorized
; extractelements operands.
;
; The function loads elements 5, 6, 8 and 9 of a [13 x double] array based at
; null. The entry block folds two of them (elements 6 and 9) plus two constant
; products into a 'reassoc nsz' fadd chain; block %bb then builds a second,
; strictly ordered fadd chain over all four loaded values.
;
; NOTE(review): in the autogenerated assertions below, the widening shuffle
; (TMP3) places the two extracted loads in lanes 0-1 and poison in lanes 2-3
; before the fmul and the fadd reduction, whereas the scalar chain adds the two
; constant products %0 and %1 as its other terms. Presumably this is the
; incorrect mask the test is meant to record - confirm against PR72202.
define double @test() {
; CHECK-LABEL: define double @test() {
; CHECK-NEXT: entry:
; CHECK-NEXT: [[TMP0:%.*]] = load <2 x double>, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 5), align 8
; CHECK-NEXT: [[TMP1:%.*]] = load <2 x double>, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 8), align 16
; CHECK-NEXT: [[TMP2:%.*]] = shufflevector <2 x double> [[TMP0]], <2 x double> [[TMP1]], <2 x i32> <i32 1, i32 3>
; CHECK-NEXT: [[TMP3:%.*]] = shufflevector <2 x double> [[TMP2]], <2 x double> poison, <4 x i32> <i32 0, i32 1, i32 poison, i32 poison>
; CHECK-NEXT: [[TMP4:%.*]] = fmul <4 x double> zeroinitializer, [[TMP3]]
; CHECK-NEXT: [[TMP5:%.*]] = call reassoc nsz double @llvm.vector.reduce.fadd.v4f64(double -0.000000e+00, <4 x double> [[TMP4]])
; CHECK-NEXT: [[TMP6:%.*]] = fmul double [[TMP5]], 0.000000e+00
; CHECK-NEXT: store double [[TMP6]], ptr null, align 16
; CHECK-NEXT: br label [[BB:%.*]]
; CHECK: bb:
; CHECK-NEXT: [[TMP7:%.*]] = fmul <2 x double> [[TMP1]], zeroinitializer
; CHECK-NEXT: [[TMP8:%.*]] = extractelement <2 x double> [[TMP7]], i32 0
; CHECK-NEXT: [[TMP9:%.*]] = extractelement <2 x double> [[TMP7]], i32 1
; CHECK-NEXT: [[TMP10:%.*]] = fadd double [[TMP8]], [[TMP9]]
; CHECK-NEXT: [[TMP11:%.*]] = fmul <2 x double> [[TMP0]], zeroinitializer
; CHECK-NEXT: [[TMP12:%.*]] = extractelement <2 x double> [[TMP11]], i32 1
; CHECK-NEXT: [[TMP13:%.*]] = fadd double [[TMP12]], [[TMP10]]
; CHECK-NEXT: [[TMP14:%.*]] = extractelement <2 x double> [[TMP11]], i32 0
; CHECK-NEXT: [[TMP15:%.*]] = fadd double [[TMP14]], [[TMP13]]
; CHECK-NEXT: ret double [[TMP15]]
;
entry:
; Two constant products start the reassociable (reassoc nsz) fadd chain.
%0 = fmul double 0.000000e+00, 0.000000e+00
%1 = fmul double 0.000000e+00, 0.000000e+00
%2 = fadd reassoc nsz double %1, %0
; Elements 5 and 6: %3 is loaded here but only used in %bb; %4 is used in both
; blocks.
%3 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 5), align 8
%4 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 6), align 16
%5 = fmul double %4, 0.000000e+00
%6 = fadd reassoc nsz double %5, %2
; Elements 8 and 9 follow the same pattern: %7 is only used in %bb, %8 is used
; in both blocks.
%7 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 8), align 16
%8 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 9), align 8
%9 = fmul double %8, 0.000000e+00
%10 = fadd reassoc nsz double %9, %6
; %10 is the four-term sum %0 + %1 + %5 + %9; scale it by 0.0 and store it.
%11 = fmul double %10, 0.000000e+00
store double %11, ptr null, align 16
br label %bb

bb:
; Second fadd chain, this time without fast-math flags, over all four loaded
; values (%8, %7, %4, %3), each multiplied by 0.0. Its result is returned.
%12 = fmul double %8, 0.000000e+00
%13 = fmul double %7, 0.000000e+00
%14 = fadd double %13, %12
%15 = fmul double %4, 0.000000e+00
%16 = fadd double %15, %14
%17 = fmul double %3, 0.000000e+00
%18 = fadd double %17, %16
ret double %18
}

0 comments on commit 181b2c1

Please sign in to comment.