diff --git a/llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp b/llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp index 1f069cb9eb514..ed7a040dac90c 100644 --- a/llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp +++ b/llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp @@ -1463,8 +1463,26 @@ InstructionCost RISCVTTIImpl::getVectorInstrCost(unsigned Opcode, Type *Val, std::pair LT = getTypeLegalizationCost(Val); // This type is legalized to a scalar type. - if (!LT.second.isVector()) - return 0; + if (!LT.second.isVector()) { + auto *FixedVecTy = cast<FixedVectorType>(Val); + // If Index is a known constant, cost is zero. + if (Index != -1U) + return 0; + // Extract/InsertElement with non-constant index is very costly when + // scalarized; estimate cost of loads/stores sequence via the stack: + // ExtractElement cost: store vector to stack, load scalar; + // InsertElement cost: store vector to stack, store scalar, load vector. + Type *ElemTy = FixedVecTy->getElementType(); + auto NumElems = FixedVecTy->getNumElements(); + auto Align = DL.getPrefTypeAlign(ElemTy); + InstructionCost LoadCost = + getMemoryOpCost(Instruction::Load, ElemTy, Align, 0, CostKind); + InstructionCost StoreCost = + getMemoryOpCost(Instruction::Store, ElemTy, Align, 0, CostKind); + return Opcode == Instruction::ExtractElement + ? StoreCost * NumElems + LoadCost + : (StoreCost + LoadCost) * NumElems + StoreCost; + } // For unsupported scalable vector. 
if (LT.second.isScalableVector() && !LT.first.isValid()) diff --git a/llvm/test/Analysis/CostModel/RISCV/extractelement.ll b/llvm/test/Analysis/CostModel/RISCV/extractelement.ll new file mode 100644 index 0000000000000..83d74bf6840c3 --- /dev/null +++ b/llvm/test/Analysis/CostModel/RISCV/extractelement.ll @@ -0,0 +1,135 @@ +; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py UTC_ARGS: --version 3 +; RUN: opt -passes="print" 2>&1 -disable-output -mtriple=riscv32 -mattr=+f,+d,+zfh < %s | FileCheck %s --check-prefixes=RV32 +; RUN: opt -passes="print" 2>&1 -disable-output -mtriple=riscv64 -mattr=+f,+d,+zfh < %s | FileCheck %s --check-prefixes=RV64 + +define void @extractelement_int(i32 %x) { +; RV32-LABEL: 'extractelement_int' +; RV32-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2i8 = extractelement <2 x i8> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4i8 = extractelement <4 x i8> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8i8 = extractelement <8 x i8> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16i8 = extractelement <16 x i8> undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16i8 = extractelement undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2i16 = extractelement <2 x i16> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4i16 = extractelement <4 x i16> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8i16 = extractelement <8 x i16> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16i16 = extractelement <16 x i16> undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16i16 = extractelement undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2i32 = 
extractelement <2 x i32> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4i32 = extractelement <4 x i32> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8i32 = extractelement <8 x i32> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16i32 = extractelement <16 x i32> undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16i32 = extractelement undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %v2i64 = extractelement <2 x i64> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %v4i64 = extractelement <4 x i64> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %v8i64 = extractelement <8 x i64> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %v16i64 = extractelement <16 x i64> undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16i64 = extractelement undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; +; RV64-LABEL: 'extractelement_int' +; RV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2i8 = extractelement <2 x i8> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4i8 = extractelement <4 x i8> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8i8 = extractelement <8 x i8> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16i8 = extractelement <16 x i8> undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16i8 = extractelement undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2i16 = extractelement <2 x i16> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4i16 = extractelement <4 x i16> 
undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8i16 = extractelement <8 x i16> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16i16 = extractelement <16 x i16> undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16i16 = extractelement undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2i32 = extractelement <2 x i32> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4i32 = extractelement <4 x i32> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8i32 = extractelement <8 x i32> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16i32 = extractelement <16 x i32> undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16i32 = extractelement undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2i64 = extractelement <2 x i64> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4i64 = extractelement <4 x i64> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8i64 = extractelement <8 x i64> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16i64 = extractelement <16 x i64> undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16i64 = extractelement undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; + %v2i8 = extractelement <2 x i8> undef, i32 %x + %v4i8 = extractelement <4 x i8> undef, i32 %x + %v8i8 = extractelement <8 x i8> undef, i32 %x + %v16i8 = extractelement <16 x i8> undef, i32 %x + %nxv16i8 = extractelement undef, i32 %x + + %v2i16 = extractelement <2 x i16> undef, i32 %x + %v4i16 = extractelement <4 x i16> undef, i32 %x + %v8i16 = extractelement <8 x i16> undef, i32 %x + %v16i16 = 
extractelement <16 x i16> undef, i32 %x + %nxv16i16 = extractelement undef, i32 %x + + %v2i32 = extractelement <2 x i32> undef, i32 %x + %v4i32 = extractelement <4 x i32> undef, i32 %x + %v8i32 = extractelement <8 x i32> undef, i32 %x + %v16i32 = extractelement <16 x i32> undef, i32 %x + %nxv16i32 = extractelement undef, i32 %x + + %v2i64 = extractelement <2 x i64> undef, i32 %x + %v4i64 = extractelement <4 x i64> undef, i32 %x + %v8i64 = extractelement <8 x i64> undef, i32 %x + %v16i64 = extractelement <16 x i64> undef, i32 %x + %nxv16i64 = extractelement undef, i32 %x + + ret void +} + +define void @extractelement_fp(i32 %x) { +; RV32-LABEL: 'extractelement_fp' +; RV32-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f16 = extractelement <2 x half> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f16 = extractelement <4 x half> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f16 = extractelement <8 x half> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f16 = extractelement <16 x half> undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16f16 = extractelement undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f32 = extractelement <2 x float> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f32 = extractelement <4 x float> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f32 = extractelement <8 x float> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f32 = extractelement <16 x float> undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16f32 = extractelement undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f64 = extractelement <2 x double> undef, i32 %x +; RV32-NEXT: Cost Model: Found 
an estimated cost of 5 for instruction: %v4f64 = extractelement <4 x double> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f64 = extractelement <8 x double> undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f64 = extractelement <16 x double> undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16f64 = extractelement undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; +; RV64-LABEL: 'extractelement_fp' +; RV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f16 = extractelement <2 x half> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f16 = extractelement <4 x half> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f16 = extractelement <8 x half> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f16 = extractelement <16 x half> undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16f16 = extractelement undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f32 = extractelement <2 x float> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f32 = extractelement <4 x float> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f32 = extractelement <8 x float> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f32 = extractelement <16 x float> undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16f32 = extractelement undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f64 = extractelement <2 x double> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f64 = extractelement <4 x double> undef, i32 %x +; RV64-NEXT: Cost Model: 
Found an estimated cost of 9 for instruction: %v8f64 = extractelement <8 x double> undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f64 = extractelement <16 x double> undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16f64 = extractelement undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; + %v2f16 = extractelement <2 x half> undef, i32 %x + %v4f16 = extractelement <4 x half> undef, i32 %x + %v8f16 = extractelement <8 x half> undef, i32 %x + %v16f16 = extractelement <16 x half> undef, i32 %x + %nxv16f16 = extractelement undef, i32 %x + + %v2f32 = extractelement <2 x float> undef, i32 %x + %v4f32 = extractelement <4 x float> undef, i32 %x + %v8f32 = extractelement <8 x float> undef, i32 %x + %v16f32 = extractelement <16 x float> undef, i32 %x + %nxv16f32 = extractelement undef, i32 %x + + %v2f64 = extractelement <2 x double> undef, i32 %x + %v4f64 = extractelement <4 x double> undef, i32 %x + %v8f64 = extractelement <8 x double> undef, i32 %x + %v16f64 = extractelement <16 x double> undef, i32 %x + %nxv16f64 = extractelement undef, i32 %x + + ret void +} diff --git a/llvm/test/Analysis/CostModel/RISCV/insertelement.ll b/llvm/test/Analysis/CostModel/RISCV/insertelement.ll new file mode 100644 index 0000000000000..6a57d15867733 --- /dev/null +++ b/llvm/test/Analysis/CostModel/RISCV/insertelement.ll @@ -0,0 +1,135 @@ +; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py UTC_ARGS: --version 3 +; RUN: opt -passes="print" 2>&1 -disable-output -mtriple=riscv32 -mattr=+f,+d,+zfh < %s | FileCheck %s --check-prefixes=RV32 +; RUN: opt -passes="print" 2>&1 -disable-output -mtriple=riscv64 -mattr=+f,+d,+zfh < %s | FileCheck %s --check-prefixes=RV64 + +define void @insertelement_int(i32 %x) { +; RV32-LABEL: 'insertelement_int' +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2i8 = insertelement <2 x i8> undef, i8 
undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4i8 = insertelement <4 x i8> undef, i8 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8i8 = insertelement <8 x i8> undef, i8 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16i8 = insertelement <16 x i8> undef, i8 undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16i8 = insertelement undef, i8 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2i16 = insertelement <2 x i16> undef, i16 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4i16 = insertelement <4 x i16> undef, i16 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8i16 = insertelement <8 x i16> undef, i16 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16i16 = insertelement <16 x i16> undef, i16 undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16i16 = insertelement undef, i16 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2i32 = insertelement <2 x i32> undef, i32 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4i32 = insertelement <4 x i32> undef, i32 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8i32 = insertelement <8 x i32> undef, i32 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16i32 = insertelement <16 x i32> undef, i32 undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16i32 = insertelement undef, i32 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %v2i64 = insertelement <2 x i64> undef, i64 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %v4i64 = insertelement <4 x 
i64> undef, i64 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %v8i64 = insertelement <8 x i64> undef, i64 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %v16i64 = insertelement <16 x i64> undef, i64 undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16i64 = insertelement undef, i64 undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; +; RV64-LABEL: 'insertelement_int' +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2i8 = insertelement <2 x i8> undef, i8 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4i8 = insertelement <4 x i8> undef, i8 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8i8 = insertelement <8 x i8> undef, i8 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16i8 = insertelement <16 x i8> undef, i8 undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16i8 = insertelement undef, i8 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2i16 = insertelement <2 x i16> undef, i16 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4i16 = insertelement <4 x i16> undef, i16 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8i16 = insertelement <8 x i16> undef, i16 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16i16 = insertelement <16 x i16> undef, i16 undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16i16 = insertelement undef, i16 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2i32 = insertelement <2 x i32> undef, i32 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4i32 = insertelement <4 x 
i32> undef, i32 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8i32 = insertelement <8 x i32> undef, i32 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16i32 = insertelement <16 x i32> undef, i32 undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16i32 = insertelement undef, i32 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2i64 = insertelement <2 x i64> undef, i64 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4i64 = insertelement <4 x i64> undef, i64 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8i64 = insertelement <8 x i64> undef, i64 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16i64 = insertelement <16 x i64> undef, i64 undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16i64 = insertelement undef, i64 undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; + %v2i8 = insertelement <2 x i8> undef, i8 undef, i32 %x + %v4i8 = insertelement <4 x i8> undef, i8 undef, i32 %x + %v8i8 = insertelement <8 x i8> undef, i8 undef, i32 %x + %v16i8 = insertelement <16 x i8> undef, i8 undef, i32 %x + %nxv16i8 = insertelement undef, i8 undef, i32 %x + + %v2i16 = insertelement <2 x i16> undef, i16 undef, i32 %x + %v4i16 = insertelement <4 x i16> undef, i16 undef, i32 %x + %v8i16 = insertelement <8 x i16> undef, i16 undef, i32 %x + %v16i16 = insertelement <16 x i16> undef, i16 undef, i32 %x + %nxv16i16 = insertelement undef, i16 undef, i32 %x + + %v2i32 = insertelement <2 x i32> undef, i32 undef, i32 %x + %v4i32 = insertelement <4 x i32> undef, i32 undef, i32 %x + %v8i32 = insertelement <8 x i32> undef, i32 undef, i32 %x + %v16i32 = insertelement <16 x i32> undef, i32 undef, i32 %x + %nxv16i32 = insertelement undef, i32 undef, i32 %x + + 
%v2i64 = insertelement <2 x i64> undef, i64 undef, i32 %x + %v4i64 = insertelement <4 x i64> undef, i64 undef, i32 %x + %v8i64 = insertelement <8 x i64> undef, i64 undef, i32 %x + %v16i64 = insertelement <16 x i64> undef, i64 undef, i32 %x + %nxv16i64 = insertelement undef, i64 undef, i32 %x + + ret void +} + +define void @insertelement_fp(i32 %x) { +; RV32-LABEL: 'insertelement_fp' +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f16 = insertelement <2 x half> undef, half undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f16 = insertelement <4 x half> undef, half undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f16 = insertelement <8 x half> undef, half undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f16 = insertelement <16 x half> undef, half undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16f16 = insertelement undef, half undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f32 = insertelement <2 x float> undef, float undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f32 = insertelement <4 x float> undef, float undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f32 = insertelement <8 x float> undef, float undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f32 = insertelement <16 x float> undef, float undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16f32 = insertelement undef, float undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f64 = insertelement <2 x double> undef, double undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f64 = insertelement <4 x double> undef, double undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 
17 for instruction: %v8f64 = insertelement <8 x double> undef, double undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f64 = insertelement <16 x double> undef, double undef, i32 %x +; RV32-NEXT: Cost Model: Invalid cost for instruction: %nxv16f64 = insertelement undef, double undef, i32 %x +; RV32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; +; RV64-LABEL: 'insertelement_fp' +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f16 = insertelement <2 x half> undef, half undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f16 = insertelement <4 x half> undef, half undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f16 = insertelement <8 x half> undef, half undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f16 = insertelement <16 x half> undef, half undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16f16 = insertelement undef, half undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f32 = insertelement <2 x float> undef, float undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f32 = insertelement <4 x float> undef, float undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f32 = insertelement <8 x float> undef, float undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f32 = insertelement <16 x float> undef, float undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16f32 = insertelement undef, float undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f64 = insertelement <2 x double> undef, double undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f64 = insertelement <4 x double> undef, double 
undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f64 = insertelement <8 x double> undef, double undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f64 = insertelement <16 x double> undef, double undef, i32 %x +; RV64-NEXT: Cost Model: Invalid cost for instruction: %nxv16f64 = insertelement undef, double undef, i32 %x +; RV64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; + %v2f16 = insertelement <2 x half> undef, half undef, i32 %x + %v4f16 = insertelement <4 x half> undef, half undef, i32 %x + %v8f16 = insertelement <8 x half> undef, half undef, i32 %x + %v16f16 = insertelement <16 x half> undef, half undef, i32 %x + %nxv16f16 = insertelement undef, half undef, i32 %x + + %v2f32 = insertelement <2 x float> undef, float undef, i32 %x + %v4f32 = insertelement <4 x float> undef, float undef, i32 %x + %v8f32 = insertelement <8 x float> undef, float undef, i32 %x + %v16f32 = insertelement <16 x float> undef, float undef, i32 %x + %nxv16f32 = insertelement undef, float undef, i32 %x + + %v2f64 = insertelement <2 x double> undef, double undef, i32 %x + %v4f64 = insertelement <4 x double> undef, double undef, i32 %x + %v8f64 = insertelement <8 x double> undef, double undef, i32 %x + %v16f64 = insertelement <16 x double> undef, double undef, i32 %x + %nxv16f64 = insertelement undef, double undef, i32 %x + + ret void +} diff --git a/llvm/test/Analysis/CostModel/RISCV/rvv-extractelement.ll b/llvm/test/Analysis/CostModel/RISCV/rvv-extractelement.ll index e33beaac4f421..225bad6da5915 100644 --- a/llvm/test/Analysis/CostModel/RISCV/rvv-extractelement.ll +++ b/llvm/test/Analysis/CostModel/RISCV/rvv-extractelement.ll @@ -1202,32 +1202,32 @@ define void @extractelement_fp(i32 %x) { ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f64_1 = extractelement undef, i32 1 ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f64_1 = extractelement 
undef, i32 1 ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f64_1 = extractelement undef, i32 1 -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f16_x = extractelement <2 x half> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f16_x = extractelement <4 x half> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f16_x = extractelement <8 x half> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f16_x = extractelement <16 x half> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v32f16_x = extractelement <32 x half> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v64f16_x = extractelement <64 x half> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f16_x = extractelement <2 x half> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f16_x = extractelement <4 x half> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f16_x = extractelement <8 x half> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f16_x = extractelement <16 x half> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v32f16_x = extractelement <32 x half> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %v64f16_x = extractelement <64 x half> undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f16_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f16_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f16_x = extractelement undef, i32 %x ; 
RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f16_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv32f16_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv64f16_x = extractelement undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f32_x = extractelement <2 x float> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f32_x = extractelement <4 x float> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f32_x = extractelement <8 x float> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f32_x = extractelement <16 x float> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v32f32_x = extractelement <32 x float> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f32_x = extractelement <2 x float> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f32_x = extractelement <4 x float> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f32_x = extractelement <8 x float> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f32_x = extractelement <16 x float> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v32f32_x = extractelement <32 x float> undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f32_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f32_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f32_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: 
%nxv16f32_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv32f32_x = extractelement undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f64_x = extractelement <2 x double> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f64_x = extractelement <4 x double> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f64_x = extractelement <8 x double> undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f64_x = extractelement <16 x double> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %v2f64_x = extractelement <2 x double> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %v4f64_x = extractelement <4 x double> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %v8f64_x = extractelement <8 x double> undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %v16f64_x = extractelement <16 x double> undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f64_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f64_x = extractelement undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f64_x = extractelement undef, i32 %x @@ -1295,32 +1295,32 @@ define void @extractelement_fp(i32 %x) { ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f64_1 = extractelement undef, i32 1 ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f64_1 = extractelement undef, i32 1 ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f64_1 = extractelement undef, i32 1 -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f16_x = extractelement <2 x half> 
undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f16_x = extractelement <4 x half> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f16_x = extractelement <8 x half> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f16_x = extractelement <16 x half> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v32f16_x = extractelement <32 x half> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v64f16_x = extractelement <64 x half> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f16_x = extractelement <2 x half> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f16_x = extractelement <4 x half> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f16_x = extractelement <8 x half> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f16_x = extractelement <16 x half> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v32f16_x = extractelement <32 x half> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %v64f16_x = extractelement <64 x half> undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f16_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f16_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f16_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f16_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv32f16_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: 
Invalid cost for instruction: %nxv64f16_x = extractelement undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f32_x = extractelement <2 x float> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f32_x = extractelement <4 x float> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f32_x = extractelement <8 x float> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f32_x = extractelement <16 x float> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v32f32_x = extractelement <32 x float> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f32_x = extractelement <2 x float> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f32_x = extractelement <4 x float> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f32_x = extractelement <8 x float> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f32_x = extractelement <16 x float> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v32f32_x = extractelement <32 x float> undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f32_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f32_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f32_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f32_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv32f32_x = extractelement undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f64_x = 
extractelement <2 x double> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f64_x = extractelement <4 x double> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f64_x = extractelement <8 x double> undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f64_x = extractelement <16 x double> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %v2f64_x = extractelement <2 x double> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v4f64_x = extractelement <4 x double> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v8f64_x = extractelement <8 x double> undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v16f64_x = extractelement <16 x double> undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f64_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f64_x = extractelement undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f64_x = extractelement undef, i32 %x diff --git a/llvm/test/Analysis/CostModel/RISCV/rvv-insertelement.ll b/llvm/test/Analysis/CostModel/RISCV/rvv-insertelement.ll index a193857e6e0f8..5387c8dc35940 100644 --- a/llvm/test/Analysis/CostModel/RISCV/rvv-insertelement.ll +++ b/llvm/test/Analysis/CostModel/RISCV/rvv-insertelement.ll @@ -1202,32 +1202,32 @@ define void @insertelement_fp(i32 %x) { ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f64_1 = insertelement undef, double undef, i32 1 ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f64_1 = insertelement undef, double undef, i32 1 ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f64_1 = insertelement undef, double undef, i32 1 -; RV32ZVE64X-NEXT: 
Cost Model: Found an estimated cost of 0 for instruction: %v2f16_x = insertelement <2 x half> undef, half undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f16_x = insertelement <4 x half> undef, half undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f16_x = insertelement <8 x half> undef, half undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f16_x = insertelement <16 x half> undef, half undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v32f16_x = insertelement <32 x half> undef, half undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v64f16_x = insertelement <64 x half> undef, half undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f16_x = insertelement <2 x half> undef, half undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f16_x = insertelement <4 x half> undef, half undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f16_x = insertelement <8 x half> undef, half undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f16_x = insertelement <16 x half> undef, half undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %v32f16_x = insertelement <32 x half> undef, half undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 129 for instruction: %v64f16_x = insertelement <64 x half> undef, half undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f16_x = insertelement undef, half undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f16_x = insertelement undef, half undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f16_x = insertelement undef, 
half undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f16_x = insertelement undef, half undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv32f16_x = insertelement undef, half undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv64f16_x = insertelement undef, half undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f32_x = insertelement <2 x float> undef, float undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f32_x = insertelement <4 x float> undef, float undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f32_x = insertelement <8 x float> undef, float undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f32_x = insertelement <16 x float> undef, float undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v32f32_x = insertelement <32 x float> undef, float undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f32_x = insertelement <2 x float> undef, float undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f32_x = insertelement <4 x float> undef, float undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f32_x = insertelement <8 x float> undef, float undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f32_x = insertelement <16 x float> undef, float undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %v32f32_x = insertelement <32 x float> undef, float undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f32_x = insertelement undef, float undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f32_x = insertelement 
undef, float undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f32_x = insertelement undef, float undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f32_x = insertelement undef, float undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv32f32_x = insertelement undef, float undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f64_x = insertelement <2 x double> undef, double undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f64_x = insertelement <4 x double> undef, double undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f64_x = insertelement <8 x double> undef, double undef, i32 %x -; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f64_x = insertelement <16 x double> undef, double undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %v2f64_x = insertelement <2 x double> undef, double undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %v4f64_x = insertelement <4 x double> undef, double undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %v8f64_x = insertelement <8 x double> undef, double undef, i32 %x +; RV32ZVE64X-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %v16f64_x = insertelement <16 x double> undef, double undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f64_x = insertelement undef, double undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f64_x = insertelement undef, double undef, i32 %x ; RV32ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f64_x = insertelement undef, double undef, i32 %x @@ -1295,32 +1295,32 @@ define void @insertelement_fp(i32 %x) { ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for 
instruction: %nxv4f64_1 = insertelement undef, double undef, i32 1 ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f64_1 = insertelement undef, double undef, i32 1 ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f64_1 = insertelement undef, double undef, i32 1 -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f16_x = insertelement <2 x half> undef, half undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f16_x = insertelement <4 x half> undef, half undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f16_x = insertelement <8 x half> undef, half undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f16_x = insertelement <16 x half> undef, half undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v32f16_x = insertelement <32 x half> undef, half undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v64f16_x = insertelement <64 x half> undef, half undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f16_x = insertelement <2 x half> undef, half undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f16_x = insertelement <4 x half> undef, half undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f16_x = insertelement <8 x half> undef, half undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f16_x = insertelement <16 x half> undef, half undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %v32f16_x = insertelement <32 x half> undef, half undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 129 for instruction: %v64f16_x = insertelement <64 x half> undef, half undef, i32 %x ; 
RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f16_x = insertelement undef, half undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f16_x = insertelement undef, half undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f16_x = insertelement undef, half undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f16_x = insertelement undef, half undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv32f16_x = insertelement undef, half undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv64f16_x = insertelement undef, half undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f32_x = insertelement <2 x float> undef, float undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f32_x = insertelement <4 x float> undef, float undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f32_x = insertelement <8 x float> undef, float undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f32_x = insertelement <16 x float> undef, float undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v32f32_x = insertelement <32 x float> undef, float undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f32_x = insertelement <2 x float> undef, float undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f32_x = insertelement <4 x float> undef, float undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f32_x = insertelement <8 x float> undef, float undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f32_x = insertelement <16 x float> undef, float undef, i32 %x +; RV64ZVE64X-NEXT: Cost 
Model: Found an estimated cost of 65 for instruction: %v32f32_x = insertelement <32 x float> undef, float undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f32_x = insertelement undef, float undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv4f32_x = insertelement undef, float undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f32_x = insertelement undef, float undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv16f32_x = insertelement undef, float undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv32f32_x = insertelement undef, float undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v2f64_x = insertelement <2 x double> undef, double undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v4f64_x = insertelement <4 x double> undef, double undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v8f64_x = insertelement <8 x double> undef, double undef, i32 %x -; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v16f64_x = insertelement <16 x double> undef, double undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %v2f64_x = insertelement <2 x double> undef, double undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %v4f64_x = insertelement <4 x double> undef, double undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %v8f64_x = insertelement <8 x double> undef, double undef, i32 %x +; RV64ZVE64X-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %v16f64_x = insertelement <16 x double> undef, double undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv2f64_x = insertelement undef, double undef, i32 %x ; RV64ZVE64X-NEXT: Cost 
Model: Invalid cost for instruction: %nxv4f64_x = insertelement undef, double undef, i32 %x ; RV64ZVE64X-NEXT: Cost Model: Invalid cost for instruction: %nxv8f64_x = insertelement undef, double undef, i32 %x