From 8bc790f9e6a6fc6d8fe8f41a7120269366fa0957 Mon Sep 17 00:00:00 2001 From: Diogo Sampaio Date: Sat, 15 Feb 2020 05:05:15 +0000 Subject: [PATCH] [AArch64][FPenv] Update chain of int to fp conversion Summary: When using strict fp, it is required to update the chain when performing integer type promotion of an operand of an integer to floating point conversion. Reviewers: craig.topper, john.brawn Reviewed By: craig.topper Subscribers: kristof.beyls, hiraditya, llvm-commits Tags: #llvm Differential Revision: https://reviews.llvm.org/D74597 --- .../CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp | 10 +++- llvm/test/CodeGen/AArch64/strict-fp-int-promote.ll | 67 ++++++++++++++++++++++ 2 files changed, 75 insertions(+), 2 deletions(-) create mode 100644 llvm/test/CodeGen/AArch64/strict-fp-int-promote.ll diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp index 1c6ed3d4..8e55eaa 100644 --- a/llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp @@ -1242,7 +1242,6 @@ bool DAGTypeLegalizer::PromoteIntegerOperand(SDNode *N, unsigned OpNo) { LLVM_DEBUG(dbgs() << "Promote integer operand: "; N->dump(&DAG); dbgs() << "\n"); SDValue Res = SDValue(); - if (CustomLowerNode(N, N->getOperand(OpNo).getValueType(), false)) { LLVM_DEBUG(dbgs() << "Node has been custom lowered, done\n"); return false; @@ -1339,10 +1338,17 @@ bool DAGTypeLegalizer::PromoteIntegerOperand(SDNode *N, unsigned OpNo) { if (Res.getNode() == N) return true; - assert(Res.getValueType() == N->getValueType(0) && N->getNumValues() == 1 && + const bool IsStrictFp = N->isStrictFPOpcode(); + assert(Res.getValueType() == N->getValueType(0) && + N->getNumValues() == (IsStrictFp ? 
2 : 1) && "Invalid operand expansion"); + LLVM_DEBUG(dbgs() << "Replacing: "; N->dump(&DAG); dbgs() << " with: "; + Res.dump()); ReplaceValueWith(SDValue(N, 0), Res); + if (IsStrictFp) + ReplaceValueWith(SDValue(N, 1), SDValue(Res.getNode(), 1)); + return false; } diff --git a/llvm/test/CodeGen/AArch64/strict-fp-int-promote.ll b/llvm/test/CodeGen/AArch64/strict-fp-int-promote.ll new file mode 100644 index 0000000..296f058 --- /dev/null +++ b/llvm/test/CodeGen/AArch64/strict-fp-int-promote.ll @@ -0,0 +1,67 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -O0 -o - %s | FileCheck %s +; RUN: llc -O3 -o - %s | FileCheck %s --check-prefix=SUBOPTIMAL +target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128" +target triple = "aarch64-arm-none-eabi" + +declare float @llvm.experimental.constrained.sitofp.f32.i32(i32, metadata, metadata) +declare float @llvm.experimental.constrained.sitofp.f32.i16(i16, metadata, metadata) +declare i1 @llvm.experimental.constrained.fcmp.f32(float, float, metadata, metadata) +declare float @llvm.experimental.constrained.uitofp.f32.i16(i16, metadata, metadata) + +define i32 @test() #0 { +; CHECK-LABEL: test: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: mov w8, #1 +; CHECK-NEXT: scvtf s0, w8 +; CHECK-NEXT: fcmp s0, s0 +; CHECK-NEXT: cset w0, eq +; CHECK-NEXT: ret +; +; SUBOPTIMAL-LABEL: test: +; SUBOPTIMAL: // %bb.0: // %entry +; SUBOPTIMAL-NEXT: mov w8, #1 +; SUBOPTIMAL-NEXT: scvtf s0, w8 +; SUBOPTIMAL-NEXT: mov w8, #1 +; SUBOPTIMAL-NEXT: scvtf s1, w8 +; SUBOPTIMAL-NEXT: fcmp s0, s1 +; SUBOPTIMAL-NEXT: cset w8, eq +; SUBOPTIMAL-NEXT: and w0, w8, #0x1 +; SUBOPTIMAL-NEXT: ret +entry: + %conv = call float @llvm.experimental.constrained.sitofp.f32.i32(i32 1, metadata !"round.tonearest", metadata !"fpexcept.strict") + %conv1 = call float @llvm.experimental.constrained.sitofp.f32.i16(i16 1, metadata !"round.tonearest", metadata !"fpexcept.strict") + %cmp = call i1 
@llvm.experimental.constrained.fcmp.f32(float %conv, float %conv1, metadata !"oeq", metadata !"fpexcept.strict") + %conv2 = zext i1 %cmp to i32 + ret i32 %conv2 +} + +define i32 @test2() #0 { +; CHECK-LABEL: test2: +; CHECK: // %bb.0: // %entry +; CHECK-NEXT: mov w8, #1 +; CHECK-NEXT: scvtf s0, w8 +; CHECK-NEXT: ucvtf s1, w8 +; CHECK-NEXT: fcmp s0, s1 +; CHECK-NEXT: cset w0, eq +; CHECK-NEXT: ret +; +; SUBOPTIMAL-LABEL: test2: +; SUBOPTIMAL: // %bb.0: // %entry +; SUBOPTIMAL-NEXT: mov w8, #1 +; SUBOPTIMAL-NEXT: scvtf s0, w8 +; SUBOPTIMAL-NEXT: mov w8, #1 +; SUBOPTIMAL-NEXT: ucvtf s1, w8 +; SUBOPTIMAL-NEXT: fcmp s0, s1 +; SUBOPTIMAL-NEXT: cset w8, eq +; SUBOPTIMAL-NEXT: and w0, w8, #0x1 +; SUBOPTIMAL-NEXT: ret +entry: + %conv = call float @llvm.experimental.constrained.sitofp.f32.i32(i32 1, metadata !"round.tonearest", metadata !"fpexcept.strict") + %conv1 = call float @llvm.experimental.constrained.uitofp.f32.i16(i16 1, metadata !"round.tonearest", metadata !"fpexcept.strict") + %cmp = call i1 @llvm.experimental.constrained.fcmp.f32(float %conv, float %conv1, metadata !"oeq", metadata !"fpexcept.strict") + %conv2 = zext i1 %cmp to i32 + ret i32 %conv2 +} + +attributes #0 = { noinline optnone } -- 2.7.4