From: Tom Stellard Date: Fri, 11 May 2018 05:44:16 +0000 (+0000) Subject: AMDGPU/GlobalISel: Implement select() for 32-bit G_FPTOUI X-Git-Tag: llvmorg-7.0.0-rc1~6249 X-Git-Url: http://review.tizen.org/git/?a=commitdiff_plain;h=dcc95e938562421aac93cb4c41714d6a260f595e;p=platform%2Fupstream%2Fllvm.git AMDGPU/GlobalISel: Implement select() for 32-bit G_FPTOUI Reviewers: arsenm, nhaehnle Subscribers: kzhuravl, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, llvm-commits Differential Revision: https://reviews.llvm.org/D45883 llvm-svn: 332082 --- diff --git a/llvm/lib/Target/AMDGPU/AMDGPUGISel.td b/llvm/lib/Target/AMDGPU/AMDGPUGISel.td index 74b73de..c9dfbaf 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUGISel.td +++ b/llvm/lib/Target/AMDGPU/AMDGPUGISel.td @@ -18,6 +18,10 @@ def gi_vsrc0 : GIComplexOperandMatcher, GIComplexPatternEquiv; +def gi_vop3mods0 : + GIComplexOperandMatcher, + GIComplexPatternEquiv; + class GISelSop2Pat < SDPatternOperator node, Instruction inst, diff --git a/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.cpp b/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.cpp index 085a9c2..52ecca7 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.cpp +++ b/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.cpp @@ -455,6 +455,7 @@ bool AMDGPUInstructionSelector::select(MachineInstr &I, switch (I.getOpcode()) { default: break; + case TargetOpcode::G_FPTOUI: case TargetOpcode::G_OR: return selectImpl(I, CoverageInfo); case TargetOpcode::G_ADD: @@ -482,3 +483,13 @@ AMDGPUInstructionSelector::selectVSRC0(MachineOperand &Root) const { [=](MachineInstrBuilder &MIB) { MIB.add(Root); } }}; } + +InstructionSelector::ComplexRendererFns +AMDGPUInstructionSelector::selectVOP3Mods0(MachineOperand &Root) const { + return {{ + [=](MachineInstrBuilder &MIB) { MIB.add(Root); }, + [=](MachineInstrBuilder &MIB) { MIB.addImm(0); }, // src0_mods + [=](MachineInstrBuilder &MIB) { MIB.addImm(0); }, // clamp + [=](MachineInstrBuilder &MIB) { MIB.addImm(0); } // omod + }}; +} diff --git a/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.h b/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.h index f9ab4d0..cdad743 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.h +++ b/llvm/lib/Target/AMDGPU/AMDGPUInstructionSelector.h @@ -73,6 +73,9 @@ private: InstructionSelector::ComplexRendererFns selectVSRC0(MachineOperand &Root) const; + InstructionSelector::ComplexRendererFns + selectVOP3Mods0(MachineOperand &Root) const; + const SIInstrInfo &TII; const SIRegisterInfo &TRI; const AMDGPURegisterBankInfo &RBI; diff --git a/llvm/test/CodeGen/AMDGPU/GlobalISel/inst-select-fptoui.mir b/llvm/test/CodeGen/AMDGPU/GlobalISel/inst-select-fptoui.mir new file mode 100644 index 0000000..07f19c4 --- /dev/null +++ b/llvm/test/CodeGen/AMDGPU/GlobalISel/inst-select-fptoui.mir @@ -0,0 +1,36 @@ +# RUN: llc -march=amdgcn -run-pass=instruction-select -verify-machineinstrs -global-isel %s -o - | FileCheck %s -check-prefixes=GCN + +--- | + define amdgpu_kernel void @fptoui(i32 addrspace(1)* %global0) {ret void} +... +--- + +name: fptoui +legalized: true +regBankSelected: true + +# GCN-LABEL: name: fptoui +body: | + bb.0: + liveins: $sgpr0, $vgpr0, $vgpr3_vgpr4 + + ; GCN: [[SGPR:%[0-9]+]]:sreg_32_xm0 = COPY $sgpr0 + %0:sgpr(s32) = COPY $sgpr0 + + ; GCN: [[VGPR:%[0-9]+]]:vgpr_32 = COPY $vgpr0 + %1:vgpr(s32) = COPY $vgpr0 + + %2:vgpr(s64) = COPY $vgpr3_vgpr4 + + ; fptoui s + ; GCN: V_CVT_U32_F32_e64 0, [[SGPR]], 0, 0 + %3:vgpr(s32) = G_FPTOUI %0 + + ; fptoui v + ; GCN: V_CVT_U32_F32_e64 0, [[VGPR]], 0, 0 + %4:vgpr(s32) = G_FPTOUI %1 + + G_STORE %3, %2 :: (store 4 into %ir.global0) + G_STORE %4, %2 :: (store 4 into %ir.global0) +... +---