From f233b92f92a669f9f2cc6d08d57ca4931dd61b78 Mon Sep 17 00:00:00 2001 From: Hiroshi Yamauchi Date: Tue, 7 Jul 2020 11:13:55 -0700 Subject: [PATCH] [PGO][PGSO] Add profile guided size optimization to LegalizeDAG. Reviewers: davidxl Subscribers: hiraditya, llvm-commits Tags: #llvm Differential Revision: https://reviews.llvm.org/D83333 --- llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp | 2 +- llvm/test/CodeGen/AArch64/arm64-fp-imm-size.ll | 35 ++++++++++++++++++++++++++ 2 files changed, 36 insertions(+), 1 deletion(-) diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp index 5fff4c0..cbbcaf1 100644 --- a/llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp @@ -3319,7 +3319,7 @@ bool SelectionDAGLegalize::ExpandNode(SDNode *Node) { // Check to see if this FP immediate is already legal. // If this is a legal constant, turn it into a TargetConstantFP node. if (!TLI.isFPImmLegal(CFP->getValueAPF(), Node->getValueType(0), - DAG.getMachineFunction().getFunction().hasOptSize())) + DAG.shouldOptForSize())) Results.push_back(ExpandConstantFP(CFP, true)); break; } diff --git a/llvm/test/CodeGen/AArch64/arm64-fp-imm-size.ll b/llvm/test/CodeGen/AArch64/arm64-fp-imm-size.ll index 5966fc6..58b025a 100644 --- a/llvm/test/CodeGen/AArch64/arm64-fp-imm-size.ll +++ b/llvm/test/CodeGen/AArch64/arm64-fp-imm-size.ll @@ -38,3 +38,38 @@ define fp128 @baz() optsize { ; CHECK-NEXT: ret ret fp128 0xL00000000000000000000000000000000 } + +; CHECK: literal8 +; CHECK: .quad 0x0000001fffffffd +define double @foo2_pgso() !prof !14 { +; CHECK: _foo2_pgso: +; CHECK: adrp x[[REG:[0-9]+]], lCPI4_0@PAGE +; CHECK: ldr d0, [x[[REG]], lCPI4_0@PAGEOFF] +; CHECK-NEXT: ret + ret double 0x1FFFFFFFd1 +} + +define float @bar_pgso() !prof !14 { +; CHECK: _bar_pgso: +; CHECK: adrp x[[REG:[0-9]+]], lCPI5_0@PAGE +; CHECK: ldr s0, [x[[REG]], lCPI5_0@PAGEOFF] +; CHECK-NEXT: ret + ret float 0x400921FB80000000 +} + +!llvm.module.flags = !{!0} +!0 = !{i32 1, !"ProfileSummary", !1} +!1 = !{!2, !3, !4, !5, !6, !7, !8, !9} +!2 = !{!"ProfileFormat", !"InstrProf"} +!3 = !{!"TotalCount", i64 10000} +!4 = !{!"MaxCount", i64 10} +!5 = !{!"MaxInternalCount", i64 1} +!6 = !{!"MaxFunctionCount", i64 1000} +!7 = !{!"NumCounts", i64 3} +!8 = !{!"NumFunctions", i64 3} +!9 = !{!"DetailedSummary", !10} +!10 = !{!11, !12, !13} +!11 = !{i32 10000, i64 100, i32 1} +!12 = !{i32 999000, i64 100, i32 1} +!13 = !{i32 999999, i64 1, i32 2} +!14 = !{!"function_entry_count", i64 0} -- 2.7.4