From: Sjoerd Meijer Date: Wed, 23 Jun 2021 12:40:46 +0000 (+0100) Subject: [AArch64] Precommit extending load tests for D104782. NFC. X-Git-Tag: llvmorg-14-init~3114 X-Git-Url: http://review.tizen.org/git/?a=commitdiff_plain;h=c74aea46634347e2ad20111271faebec2da38af3;p=platform%2Fupstream%2Fllvm.git [AArch64] Precommit extending load tests for D104782. NFC. --- diff --git a/llvm/test/CodeGen/AArch64/neon-extload.ll b/llvm/test/CodeGen/AArch64/neon-extload.ll new file mode 100644 index 0000000..321a1ba --- /dev/null +++ b/llvm/test/CodeGen/AArch64/neon-extload.ll @@ -0,0 +1,145 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc < %s -verify-machineinstrs -mtriple=aarch64-none-linux-gnu -mattr=+neon | FileCheck %s --check-prefix=LE +; RUN: llc < %s -verify-machineinstrs -mtriple=aarch64_be-none-linux-gnu -mattr=+neon | FileCheck %s --check-prefix=BE + +define <4 x i32> @fsext_v4i32(<4 x i8>* %a) { +; LE-LABEL: fsext_v4i32: +; LE: // %bb.0: +; LE-NEXT: ldrsb w8, [x0] +; LE-NEXT: ldrsb w9, [x0, #1] +; LE-NEXT: ldrsb w10, [x0, #2] +; LE-NEXT: ldrsb w11, [x0, #3] +; LE-NEXT: fmov s0, w8 +; LE-NEXT: mov v0.s[1], w9 +; LE-NEXT: mov v0.s[2], w10 +; LE-NEXT: mov v0.s[3], w11 +; LE-NEXT: ret +; +; BE-LABEL: fsext_v4i32: +; BE: // %bb.0: +; BE-NEXT: ldrsb w8, [x0] +; BE-NEXT: ldrsb w9, [x0, #1] +; BE-NEXT: ldrsb w10, [x0, #2] +; BE-NEXT: ldrsb w11, [x0, #3] +; BE-NEXT: fmov s0, w8 +; BE-NEXT: mov v0.s[1], w9 +; BE-NEXT: mov v0.s[2], w10 +; BE-NEXT: mov v0.s[3], w11 +; BE-NEXT: rev64 v0.4s, v0.4s +; BE-NEXT: ext v0.16b, v0.16b, v0.16b, #8 +; BE-NEXT: ret + %x = load <4 x i8>, <4 x i8>* %a + %y = sext <4 x i8> %x to <4 x i32> + ret <4 x i32> %y +} + +define <4 x i32> @fzext_v4i32(<4 x i8>* %a) { +; LE-LABEL: fzext_v4i32: +; LE: // %bb.0: +; LE-NEXT: ldrb w8, [x0] +; LE-NEXT: ldrb w9, [x0, #1] +; LE-NEXT: ldrb w10, [x0, #2] +; LE-NEXT: ldrb w11, [x0, #3] +; LE-NEXT: fmov s0, w8 +; LE-NEXT: mov v0.s[1], w9 +; LE-NEXT: mov v0.s[2], w10 +; LE-NEXT: mov v0.s[3], w11 +; LE-NEXT: ret +; +; BE-LABEL: fzext_v4i32: +; BE: // %bb.0: +; BE-NEXT: ldrb w8, [x0] +; BE-NEXT: ldrb w9, [x0, #1] +; BE-NEXT: ldrb w10, [x0, #2] +; BE-NEXT: ldrb w11, [x0, #3] +; BE-NEXT: fmov s0, w8 +; BE-NEXT: mov v0.s[1], w9 +; BE-NEXT: mov v0.s[2], w10 +; BE-NEXT: mov v0.s[3], w11 +; BE-NEXT: rev64 v0.4s, v0.4s +; BE-NEXT: ext v0.16b, v0.16b, v0.16b, #8 +; BE-NEXT: ret + %x = load <4 x i8>, <4 x i8>* %a + %y = zext <4 x i8> %x to <4 x i32> + ret <4 x i32> %y +} + +define i32 @loadExt.i32(<4 x i8>* %ref) { +; CHECK-LABEL: loadExt.i32: +; CHECK: ldrb +; LE-LABEL: loadExt.i32: +; LE: // %bb.0: +; LE-NEXT: ldrb w0, [x0] +; LE-NEXT: ret +; +; BE-LABEL: loadExt.i32: +; BE: // %bb.0: +; BE-NEXT: ldrb w0, [x0] +; BE-NEXT: ret + %a = load <4 x i8>, <4 x i8>* %ref + %vecext = extractelement <4 x i8> %a, i32 0 + %conv = zext i8 %vecext to i32 + ret i32 %conv +} + +define <4 x i16> @fsext_v4i16(<4 x i8>* %a) { +; LE-LABEL: fsext_v4i16: +; LE: // %bb.0: +; LE-NEXT: ldrsb w8, [x0] +; LE-NEXT: ldrsb w9, [x0, #1] +; LE-NEXT: ldrsb w10, [x0, #2] +; LE-NEXT: ldrsb w11, [x0, #3] +; LE-NEXT: fmov s0, w8 +; LE-NEXT: mov v0.h[1], w9 +; LE-NEXT: mov v0.h[2], w10 +; LE-NEXT: mov v0.h[3], w11 +; LE-NEXT: // kill: def $d0 killed $d0 killed $q0 +; LE-NEXT: ret +; +; BE-LABEL: fsext_v4i16: +; BE: // %bb.0: +; BE-NEXT: ldrsb w8, [x0] +; BE-NEXT: ldrsb w9, [x0, #1] +; BE-NEXT: ldrsb w10, [x0, #2] +; BE-NEXT: ldrsb w11, [x0, #3] +; BE-NEXT: fmov s0, w8 +; BE-NEXT: mov v0.h[1], w9 +; BE-NEXT: mov v0.h[2], w10 +; BE-NEXT: mov v0.h[3], w11 +; BE-NEXT: rev64 v0.4h, v0.4h +; BE-NEXT: ret + %x = load <4 x i8>, <4 x i8>* %a + %y = sext <4 x i8> %x to <4 x i16> + ret <4 x i16> %y +} + +define <4 x i16> @fzext_v4i16(<4 x i8>* %a) { +; LE-LABEL: fzext_v4i16: +; LE: // %bb.0: +; LE-NEXT: ldrb w8, [x0] +; LE-NEXT: ldrb w9, [x0, #1] +; LE-NEXT: ldrb w10, [x0, #2] +; LE-NEXT: ldrb w11, [x0, #3] +; LE-NEXT: fmov s0, w8 +; LE-NEXT: mov v0.h[1], w9 +; LE-NEXT: mov v0.h[2], w10 +; LE-NEXT: mov v0.h[3], w11 +; LE-NEXT: // kill: def $d0 killed $d0 killed $q0 +; LE-NEXT: ret +; +; BE-LABEL: fzext_v4i16: +; BE: // %bb.0: +; BE-NEXT: ldrb w8, [x0] +; BE-NEXT: ldrb w9, [x0, #1] +; BE-NEXT: ldrb w10, [x0, #2] +; BE-NEXT: ldrb w11, [x0, #3] +; BE-NEXT: fmov s0, w8 +; BE-NEXT: mov v0.h[1], w9 +; BE-NEXT: mov v0.h[2], w10 +; BE-NEXT: mov v0.h[3], w11 +; BE-NEXT: rev64 v0.4h, v0.4h +; BE-NEXT: ret + %x = load <4 x i8>, <4 x i8>* %a + %y = zext <4 x i8> %x to <4 x i16> + ret <4 x i16> %y +} diff --git a/llvm/test/CodeGen/AArch64/neon-truncStore-extLoad.ll b/llvm/test/CodeGen/AArch64/neon-truncstore.ll similarity index 66% rename from llvm/test/CodeGen/AArch64/neon-truncStore-extLoad.ll rename to llvm/test/CodeGen/AArch64/neon-truncstore.ll index 2f2f54f..2bbab0b 100644 --- a/llvm/test/CodeGen/AArch64/neon-truncStore-extLoad.ll +++ b/llvm/test/CodeGen/AArch64/neon-truncstore.ll @@ -38,30 +38,3 @@ define void @truncStore.v8i16(<8 x i16> %a, <8 x i8>* %result) { store <8 x i8> %b, <8 x i8>* %result ret void } - -; A vector LoadExt can not be selected. -; Test a vector load IR and a sext/zext IR can be selected correctly. -define <4 x i32> @loadSExt.v4i8(<4 x i8>* %ref) { -; CHECK-LABEL: loadSExt.v4i8: -; CHECK: ldrsb - %a = load <4 x i8>, <4 x i8>* %ref - %conv = sext <4 x i8> %a to <4 x i32> - ret <4 x i32> %conv -} - -define <4 x i32> @loadZExt.v4i8(<4 x i8>* %ref) { -; CHECK-LABEL: loadZExt.v4i8: -; CHECK: ldrb - %a = load <4 x i8>, <4 x i8>* %ref - %conv = zext <4 x i8> %a to <4 x i32> - ret <4 x i32> %conv -} - -define i32 @loadExt.i32(<4 x i8>* %ref) { -; CHECK-LABEL: loadExt.i32: -; CHECK: ldrb - %a = load <4 x i8>, <4 x i8>* %ref - %vecext = extractelement <4 x i8> %a, i32 0 - %conv = zext i8 %vecext to i32 - ret i32 %conv -}