From: Quentin Colombet Date: Fri, 11 Oct 2019 20:22:57 +0000 (+0000) Subject: [GISel][CallLowering] Enable vector support in argument lowering X-Git-Tag: llvmorg-11-init~6740 X-Git-Url: http://review.tizen.org/git/?a=commitdiff_plain;h=9c36ec5941730364d4b9befd15e20365a039a2f1;p=platform%2Fupstream%2Fllvm.git [GISel][CallLowering] Enable vector support in argument lowering The existing code is actually already enough to handle the splitting of vector arguments but we were lacking a test case. This commit adds a test case for vector argument lowering involving splitting and enables the related support in call lowering. llvm-svn: 374589 --- diff --git a/llvm/lib/CodeGen/GlobalISel/CallLowering.cpp b/llvm/lib/CodeGen/GlobalISel/CallLowering.cpp index d05e209..ed4d225 100644 --- a/llvm/lib/CodeGen/GlobalISel/CallLowering.cpp +++ b/llvm/lib/CodeGen/GlobalISel/CallLowering.cpp @@ -198,14 +198,12 @@ bool CallLowering::handleAssignments(CCState &CCInfo, unsigned NumParts = TLI->getNumRegistersForCallingConv( F.getContext(), F.getCallingConv(), CurVT); if (NumParts > 1) { - if (CurVT.isVector()) - return false; // For now only handle exact splits. if (NewVT.getSizeInBits() * NumParts != CurVT.getSizeInBits()) return false; } - // For incoming arguments (return values), we could have values in + // For incoming arguments (physregs to vregs), we could have values in // physregs (or memlocs) which we want to extract and copy to vregs. // During this, we might have to deal with the LLT being split across // multiple regs, so we have to record this information for later. @@ -221,7 +219,7 @@ bool CallLowering::handleAssignments(CCState &CCInfo, return false; } else { // We're handling an incoming arg which is split over multiple regs. - // E.g. returning an s128 on AArch64. + // E.g. passing an s128 on AArch64. 
ISD::ArgFlagsTy OrigFlags = Args[i].Flags[0]; Args[i].OrigRegs.push_back(Args[i].Regs[0]); Args[i].Regs.clear(); diff --git a/llvm/test/CodeGen/AArch64/GlobalISel/irtranslator-split-vector-arg.ll b/llvm/test/CodeGen/AArch64/GlobalISel/irtranslator-split-vector-arg.ll new file mode 100644 index 0000000..ef74cdb --- /dev/null +++ b/llvm/test/CodeGen/AArch64/GlobalISel/irtranslator-split-vector-arg.ll @@ -0,0 +1,22 @@ +; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py +; RUN: llc -global-isel -global-isel-abort=1 %s -stop-after=irtranslator -o - | FileCheck %s +target triple = "aarch64-apple-ios" + +; Check that we correctly split %arg into two vector registers of +; size <2 x i64>. +define hidden fastcc <4 x float> @foo(<4 x i64> %arg) unnamed_addr #0 { + ; CHECK-LABEL: name: foo + ; CHECK: bb.1.bb: + ; CHECK: liveins: $q0, $q1 + ; CHECK: [[COPY:%[0-9]+]]:_(<2 x s64>) = COPY $q0 + ; CHECK: [[COPY1:%[0-9]+]]:_(<2 x s64>) = COPY $q1 + ; CHECK: [[CONCAT_VECTORS:%[0-9]+]]:_(<4 x s64>) = G_CONCAT_VECTORS [[COPY]](<2 x s64>), [[COPY1]](<2 x s64>) + ; CHECK: [[UITOFP:%[0-9]+]]:_(<4 x s32>) = G_UITOFP [[CONCAT_VECTORS]](<4 x s64>) + ; CHECK: $q0 = COPY [[UITOFP]](<4 x s32>) + ; CHECK: RET_ReallyLR implicit $q0 +bb: + %tmp = uitofp <4 x i64> %arg to <4 x float> + ret <4 x float> %tmp +} + +attributes #0 = { nounwind readnone }