From: Hassnaa Hamdi Date: Thu, 2 Feb 2023 11:46:11 +0000 (+0000) Subject: [AArch64][CostModel]: Add costs for zero/sign extend. X-Git-Tag: upstream/17.0.6~18818 X-Git-Url: http://review.tizen.org/git/?a=commitdiff_plain;h=d65c3bf39aa49eda0f5a6bff02c9292895a37e26;p=platform%2Fupstream%2Fllvm.git [AArch64][CostModel]: Add costs for zero/sign extend. Add cost for extending to illegal scalable vector types. Add testing file for the extend operations. Reviewed By: sdesmalen Differential Revision: https://reviews.llvm.org/D142456 --- diff --git a/llvm/lib/Target/AArch64/AArch64TargetTransformInfo.cpp b/llvm/lib/Target/AArch64/AArch64TargetTransformInfo.cpp index c6e9e05..303ec8e 100644 --- a/llvm/lib/Target/AArch64/AArch64TargetTransformInfo.cpp +++ b/llvm/lib/Target/AArch64/AArch64TargetTransformInfo.cpp @@ -2072,6 +2072,23 @@ InstructionCost AArch64TTIImpl::getCastInstrCost(unsigned Opcode, Type *Dst, { ISD::BITCAST, MVT::nxv2i16, MVT::nxv2f16, 0 }, { ISD::BITCAST, MVT::nxv4i16, MVT::nxv4f16, 0 }, { ISD::BITCAST, MVT::nxv2i32, MVT::nxv2f32, 0 }, + + // Add cost for extending to illegal -too wide- scalable vectors. + // zero/sign extend are implemented by multiple unpack operations, + // where each operation has a cost of 1. 
+ { ISD::ZERO_EXTEND, MVT::nxv16i16, MVT::nxv16i8, 2}, + { ISD::ZERO_EXTEND, MVT::nxv16i32, MVT::nxv16i8, 6}, + { ISD::ZERO_EXTEND, MVT::nxv16i64, MVT::nxv16i8, 14}, + { ISD::ZERO_EXTEND, MVT::nxv8i32, MVT::nxv8i16, 2}, + { ISD::ZERO_EXTEND, MVT::nxv8i64, MVT::nxv8i16, 6}, + { ISD::ZERO_EXTEND, MVT::nxv4i64, MVT::nxv4i32, 2}, + + { ISD::SIGN_EXTEND, MVT::nxv16i16, MVT::nxv16i8, 2}, + { ISD::SIGN_EXTEND, MVT::nxv16i32, MVT::nxv16i8, 6}, + { ISD::SIGN_EXTEND, MVT::nxv16i64, MVT::nxv16i8, 14}, + { ISD::SIGN_EXTEND, MVT::nxv8i32, MVT::nxv8i16, 2}, + { ISD::SIGN_EXTEND, MVT::nxv8i64, MVT::nxv8i16, 6}, + { ISD::SIGN_EXTEND, MVT::nxv4i64, MVT::nxv4i32, 2}, }; if (const auto *Entry = ConvertCostTableLookup(ConversionTbl, ISD, diff --git a/llvm/test/Analysis/CostModel/AArch64/cast.ll b/llvm/test/Analysis/CostModel/AArch64/cast.ll index 96906c3..665df75 100644 --- a/llvm/test/Analysis/CostModel/AArch64/cast.ll +++ b/llvm/test/Analysis/CostModel/AArch64/cast.ll @@ -858,8 +858,8 @@ define i32 @load_extends() #0 { ; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %v13 = zext <4 x i32> %loadv4i32 to <4 x i64> ; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v14 = sext <vscale x 2 x i32> %loadnxv2i32 to <vscale x 2 x i64> ; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %v15 = zext <vscale x 2 x i32> %loadnxv2i32 to <vscale x 2 x i64> -; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %v16 = sext <vscale x 4 x i32> %loadnxv4i32 to <vscale x 4 x i64> -; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %v17 = zext <vscale x 4 x i32> %loadnxv4i32 to <vscale x 4 x i64> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %v16 = sext <vscale x 4 x i32> %loadnxv4i32 to <vscale x 4 x i64> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %v17 = zext <vscale x 4 x i32> %loadnxv4i32 to <vscale x 4 x i64> ; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; %loadi8 = load i8, ptr undef diff --git a/llvm/test/Analysis/CostModel/AArch64/sve-ext.ll b/llvm/test/Analysis/CostModel/AArch64/sve-ext.ll new file mode 100644 index 
0000000..1979be7 --- /dev/null +++ b/llvm/test/Analysis/CostModel/AArch64/sve-ext.ll @@ -0,0 +1,37 @@ +; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py +; RUN: opt -passes="print<cost-model>" 2>&1 -disable-output -mtriple aarch64-linux-gnu -mattr=+sve -S -o - < %s | FileCheck %s + +target triple = "aarch64-unknown-linux-gnu" + +define void @sve_ext() { +; CHECK-LABEL: 'sve_ext' +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %zext_nxv16_i8_to_i16 = zext <vscale x 16 x i8> undef to <vscale x 16 x i16> +; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %zext_nxv16_i8_to_i32 = zext <vscale x 16 x i8> undef to <vscale x 16 x i32> +; CHECK-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %zext_nxv16_i8_to_i64 = zext <vscale x 16 x i8> undef to <vscale x 16 x i64> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %zext_nxv8_i16_to_i32 = zext <vscale x 8 x i16> undef to <vscale x 8 x i32> +; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %zext_nxv8_i16_to_i64 = zext <vscale x 8 x i16> undef to <vscale x 8 x i64> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %zext_nxv4_i32_to_i64 = zext <vscale x 4 x i32> undef to <vscale x 4 x i64> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %sext_nxv16_i8_to_i16 = sext <vscale x 16 x i8> undef to <vscale x 16 x i16> +; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %sext_nxv16_i8_to_i32 = sext <vscale x 16 x i8> undef to <vscale x 16 x i32> +; CHECK-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %sext_nxv16_i8_to_i64 = sext <vscale x 16 x i8> undef to <vscale x 16 x i64> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %sext_nxv8_i16_to_i32 = sext <vscale x 8 x i16> undef to <vscale x 8 x i32> +; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %sext_nxv8_i16_to_i64 = sext <vscale x 8 x i16> undef to <vscale x 8 x i64> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %sext_nxv4_i32_to_i64 = sext <vscale x 4 x i32> undef to <vscale x 4 x i64> +; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void +; + %zext_nxv16_i8_to_i16 = zext <vscale x 16 x i8> undef to <vscale x 16 x i16> + %zext_nxv16_i8_to_i32 = zext <vscale x 16 x i8> undef to <vscale x 16 x i32> + %zext_nxv16_i8_to_i64 = zext <vscale x 16 x i8> undef to <vscale x 16 x i64> + %zext_nxv8_i16_to_i32 = zext <vscale x 8 x i16> undef to <vscale x 8 x i32> + 
%zext_nxv8_i16_to_i64 = zext <vscale x 8 x i16> undef to <vscale x 8 x i64> + %zext_nxv4_i32_to_i64 = zext <vscale x 4 x i32> undef to <vscale x 4 x i64> + + %sext_nxv16_i8_to_i16 = sext <vscale x 16 x i8> undef to <vscale x 16 x i16> + %sext_nxv16_i8_to_i32 = sext <vscale x 16 x i8> undef to <vscale x 16 x i32> + %sext_nxv16_i8_to_i64 = sext <vscale x 16 x i8> undef to <vscale x 16 x i64> + %sext_nxv8_i16_to_i32 = sext <vscale x 8 x i16> undef to <vscale x 8 x i32> + %sext_nxv8_i16_to_i64 = sext <vscale x 8 x i16> undef to <vscale x 8 x i64> + %sext_nxv4_i32_to_i64 = sext <vscale x 4 x i32> undef to <vscale x 4 x i64> + + ret void +} diff --git a/llvm/test/Analysis/CostModel/AArch64/sve-widening-instruction.ll b/llvm/test/Analysis/CostModel/AArch64/sve-widening-instruction.ll index 45b2c77..4d354d9 100644 --- a/llvm/test/Analysis/CostModel/AArch64/sve-widening-instruction.ll +++ b/llvm/test/Analysis/CostModel/AArch64/sve-widening-instruction.ll @@ -20,8 +20,8 @@ define <vscale x 4 x i32> @widening_nxv4i16(<vscale x 4 x i16> %in1, <vscale x 4 define <vscale x 8 x i32> @widening_nxv8i16(<vscale x 8 x i16> %in1, <vscale x 8 x i16> %in2) { ; CHECK-LABEL: 'widening_nxv8i16' -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %in1.ext = zext <vscale x 8 x i16> %in2 to <vscale x 8 x i32> -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %in2.ext = zext <vscale x 8 x i16> %in2 to <vscale x 8 x i32> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %in1.ext = zext <vscale x 8 x i16> %in2 to <vscale x 8 x i32> +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %in2.ext = zext <vscale x 8 x i16> %in2 to <vscale x 8 x i32> ; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %in.add = add <vscale x 8 x i32> %in1.ext, %in2.ext ; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <vscale x 8 x i32> %in.add ;