From 6e557e28ecf41353f207bc93d1a718ec508a68ff Mon Sep 17 00:00:00 2001 From: Chen Zheng Date: Mon, 7 Nov 2022 02:03:48 -0500 Subject: [PATCH] [PowerPC][NFC] use script to generate check lines --- llvm/test/CodeGen/PowerPC/ctrloop-fp128.ll | 207 +++++++++++++++++++++++++++-- 1 file changed, 193 insertions(+), 14 deletions(-) diff --git a/llvm/test/CodeGen/PowerPC/ctrloop-fp128.ll b/llvm/test/CodeGen/PowerPC/ctrloop-fp128.ll index de0441f..3c9f39f 100644 --- a/llvm/test/CodeGen/PowerPC/ctrloop-fp128.ll +++ b/llvm/test/CodeGen/PowerPC/ctrloop-fp128.ll @@ -1,11 +1,91 @@ -; RUN: llc < %s -verify-machineinstrs -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown | FileCheck %s -; RUN: llc < %s -verify-machineinstrs -mcpu=pwr8 -mtriple=powerpc64le-unknown-unknown | FileCheck %s +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc < %s -verify-machineinstrs -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown | FileCheck %s -check-prefix=PWR9 +; RUN: llc < %s -verify-machineinstrs -mcpu=pwr8 -mtriple=powerpc64le-unknown-unknown | FileCheck %s -check-prefix=PWR8 @a = internal global fp128 0xL00000000000000000000000000000000, align 16 @x = internal global [4 x fp128] zeroinitializer, align 16 @y = internal global [4 x fp128] zeroinitializer, align 16 -define void @fmul_ctrloop_fp128() { +define void @fmul_ctrloop_fp128() nounwind { +; PWR9-LABEL: fmul_ctrloop_fp128: +; PWR9: # %bb.0: # %entry +; PWR9-NEXT: addis 5, 2, a@toc@ha +; PWR9-NEXT: addis 3, 2, y@toc@ha +; PWR9-NEXT: addis 4, 2, x@toc@ha +; PWR9-NEXT: addi 5, 5, a@toc@l +; PWR9-NEXT: addi 3, 3, y@toc@l +; PWR9-NEXT: addi 4, 4, x@toc@l +; PWR9-NEXT: lxv 34, 0(5) +; PWR9-NEXT: addi 3, 3, -16 +; PWR9-NEXT: addi 4, 4, -16 +; PWR9-NEXT: li 5, 0 +; PWR9-NEXT: .p2align 5 +; PWR9-NEXT: .LBB0_1: # %for.body +; PWR9-NEXT: # +; PWR9-NEXT: lxv 35, 16(4) +; PWR9-NEXT: addi 5, 5, 16 +; PWR9-NEXT: addi 4, 4, 16 +; PWR9-NEXT: cmpldi 5, 64 +; PWR9-NEXT: xsmulqp 3, 2, 3 +; PWR9-NEXT: stxv 35, 16(3) +; PWR9-NEXT: addi 3, 3, 16 +; PWR9-NEXT: bne 0, .LBB0_1 +; PWR9-NEXT: # %bb.2: # %for.end +; PWR9-NEXT: blr +; +; PWR8-LABEL: fmul_ctrloop_fp128: +; PWR8: # %bb.0: # %entry +; PWR8-NEXT: mflr 0 +; PWR8-NEXT: std 0, 16(1) +; PWR8-NEXT: stdu 1, -112(1) +; PWR8-NEXT: li 3, 48 +; PWR8-NEXT: addis 4, 2, x@toc@ha +; PWR8-NEXT: std 28, 80(1) # 8-byte Folded Spill +; PWR8-NEXT: std 29, 88(1) # 8-byte Folded Spill +; PWR8-NEXT: std 30, 96(1) # 8-byte Folded Spill +; PWR8-NEXT: li 30, 0 +; PWR8-NEXT: li 29, 16 +; PWR8-NEXT: addi 4, 4, x@toc@l +; PWR8-NEXT: std 26, 64(1) # 8-byte Folded Spill +; PWR8-NEXT: stxvd2x 63, 1, 3 # 16-byte Folded Spill +; PWR8-NEXT: addis 3, 2, a@toc@ha +; PWR8-NEXT: std 27, 72(1) # 8-byte Folded Spill +; PWR8-NEXT: addi 3, 3, a@toc@l +; PWR8-NEXT: lxvd2x 0, 0, 3 +; PWR8-NEXT: addis 3, 2, y@toc@ha +; PWR8-NEXT: addi 3, 3, y@toc@l +; PWR8-NEXT: addi 28, 3, -16 +; PWR8-NEXT: addi 3, 4, -16 +; PWR8-NEXT: xxswapd 63, 0 +; PWR8-NEXT: .p2align 4 +; PWR8-NEXT: .LBB0_1: # %for.body +; PWR8-NEXT: # +; PWR8-NEXT: lxvd2x 0, 3, 29 +; PWR8-NEXT: vmr 2, 31 +; PWR8-NEXT: addi 27, 28, 16 +; PWR8-NEXT: addi 26, 3, 16 +; PWR8-NEXT: xxswapd 35, 0 +; PWR8-NEXT: bl __mulkf3 +; PWR8-NEXT: nop +; PWR8-NEXT: xxswapd 0, 34 +; PWR8-NEXT: addi 30, 30, 16 +; PWR8-NEXT: mr 3, 26 +; PWR8-NEXT: cmpldi 30, 64 +; PWR8-NEXT: stxvd2x 0, 28, 29 +; PWR8-NEXT: mr 28, 27 +; PWR8-NEXT: bne 0, .LBB0_1 +; PWR8-NEXT: # %bb.2: # %for.end +; PWR8-NEXT: li 3, 48 +; PWR8-NEXT: ld 30, 96(1) # 8-byte Folded Reload +; PWR8-NEXT: ld 29, 88(1) # 8-byte Folded Reload +; PWR8-NEXT: ld 28, 80(1) # 8-byte Folded Reload +; PWR8-NEXT: ld 27, 72(1) # 8-byte Folded Reload +; PWR8-NEXT: lxvd2x 63, 1, 3 # 16-byte Folded Reload +; PWR8-NEXT: ld 26, 64(1) # 8-byte Folded Reload +; PWR8-NEXT: addi 1, 1, 112 +; PWR8-NEXT: ld 0, 16(1) +; PWR8-NEXT: mtlr 0 +; PWR8-NEXT: blr entry: %0 = load fp128, ptr @a, align 16 br label %for.body @@ -23,12 +103,63 @@ for.body: ; preds = %for.body, %entry for.end: ; preds = %for.body ret void - -; CHECK-LABEL: fmul_ctrloop_fp128 -; CHECK-NOT: mtctr } -define void @fpext_ctrloop_fp128(ptr %a) { +define void @fpext_ctrloop_fp128(ptr %a) nounwind { +; PWR9-LABEL: fpext_ctrloop_fp128: +; PWR9: # %bb.0: # %entry +; PWR9-NEXT: addis 4, 2, y@toc@ha +; PWR9-NEXT: addi 3, 3, -8 +; PWR9-NEXT: addi 4, 4, y@toc@l +; PWR9-NEXT: addi 5, 4, -16 +; PWR9-NEXT: li 4, 0 +; PWR9-NEXT: .p2align 5 +; PWR9-NEXT: .LBB1_1: # %for.body +; PWR9-NEXT: # +; PWR9-NEXT: lfdu 0, 8(3) +; PWR9-NEXT: addi 4, 4, 8 +; PWR9-NEXT: cmpldi 4, 32 +; PWR9-NEXT: xscpsgndp 34, 0, 0 +; PWR9-NEXT: xscvdpqp 2, 2 +; PWR9-NEXT: stxv 34, 16(5) +; PWR9-NEXT: addi 5, 5, 16 +; PWR9-NEXT: bne 0, .LBB1_1 +; PWR9-NEXT: # %bb.2: # %for.end +; PWR9-NEXT: blr +; +; PWR8-LABEL: fpext_ctrloop_fp128: +; PWR8: # %bb.0: # %entry +; PWR8-NEXT: mflr 0 +; PWR8-NEXT: std 28, -32(1) # 8-byte Folded Spill +; PWR8-NEXT: std 29, -24(1) # 8-byte Folded Spill +; PWR8-NEXT: std 30, -16(1) # 8-byte Folded Spill +; PWR8-NEXT: std 0, 16(1) +; PWR8-NEXT: stdu 1, -64(1) +; PWR8-NEXT: addis 4, 2, y@toc@ha +; PWR8-NEXT: addi 30, 3, -8 +; PWR8-NEXT: li 28, 0 +; PWR8-NEXT: addi 4, 4, y@toc@l +; PWR8-NEXT: addi 29, 4, -16 +; PWR8-NEXT: .p2align 4 +; PWR8-NEXT: .LBB1_1: # %for.body +; PWR8-NEXT: # +; PWR8-NEXT: lfdu 1, 8(30) +; PWR8-NEXT: addi 29, 29, 16 +; PWR8-NEXT: bl __extenddfkf2 +; PWR8-NEXT: nop +; PWR8-NEXT: xxswapd 0, 34 +; PWR8-NEXT: addi 28, 28, 8 +; PWR8-NEXT: cmpldi 28, 32 +; PWR8-NEXT: stxvd2x 0, 0, 29 +; PWR8-NEXT: bne 0, .LBB1_1 +; PWR8-NEXT: # %bb.2: # %for.end +; PWR8-NEXT: addi 1, 1, 64 +; PWR8-NEXT: ld 0, 16(1) +; PWR8-NEXT: ld 30, -16(1) # 8-byte Folded Reload +; PWR8-NEXT: ld 29, -24(1) # 8-byte Folded Reload +; PWR8-NEXT: ld 28, -32(1) # 8-byte Folded Reload +; PWR8-NEXT: mtlr 0 +; PWR8-NEXT: blr entry: br label %for.body @@ -45,12 +176,63 @@ for.body: for.end: ret void - -; CHECK-LABEL: fpext_ctrloop_fp128 -; CHECK-NOT: mtctr } -define void @fptrunc_ctrloop_fp128(ptr %a) { +define void @fptrunc_ctrloop_fp128(ptr %a) nounwind { +; PWR9-LABEL: fptrunc_ctrloop_fp128: +; PWR9: # %bb.0: # %entry +; PWR9-NEXT: addis 4, 2, x@toc@ha +; PWR9-NEXT: addi 3, 3, -8 +; PWR9-NEXT: li 5, 0 +; PWR9-NEXT: addi 4, 4, x@toc@l +; PWR9-NEXT: addi 4, 4, -16 +; PWR9-NEXT: .p2align 5 +; PWR9-NEXT: .LBB2_1: # %for.body +; PWR9-NEXT: # +; PWR9-NEXT: lxv 34, 16(4) +; PWR9-NEXT: addi 5, 5, 8 +; PWR9-NEXT: addi 4, 4, 16 +; PWR9-NEXT: cmpldi 5, 32 +; PWR9-NEXT: xscvqpdp 2, 2 +; PWR9-NEXT: xscpsgndp 0, 34, 34 +; PWR9-NEXT: stfdu 0, 8(3) +; PWR9-NEXT: bne 0, .LBB2_1 +; PWR9-NEXT: # %bb.2: # %for.end +; PWR9-NEXT: blr +; +; PWR8-LABEL: fptrunc_ctrloop_fp128: +; PWR8: # %bb.0: # %entry +; PWR8-NEXT: mflr 0 +; PWR8-NEXT: std 28, -32(1) # 8-byte Folded Spill +; PWR8-NEXT: std 29, -24(1) # 8-byte Folded Spill +; PWR8-NEXT: std 30, -16(1) # 8-byte Folded Spill +; PWR8-NEXT: std 0, 16(1) +; PWR8-NEXT: stdu 1, -64(1) +; PWR8-NEXT: addis 4, 2, x@toc@ha +; PWR8-NEXT: addi 30, 3, -8 +; PWR8-NEXT: li 28, 0 +; PWR8-NEXT: addi 4, 4, x@toc@l +; PWR8-NEXT: addi 29, 4, -16 +; PWR8-NEXT: .p2align 4 +; PWR8-NEXT: .LBB2_1: # %for.body +; PWR8-NEXT: # +; PWR8-NEXT: addi 29, 29, 16 +; PWR8-NEXT: lxvd2x 0, 0, 29 +; PWR8-NEXT: xxswapd 34, 0 +; PWR8-NEXT: bl __trunckfdf2 +; PWR8-NEXT: nop +; PWR8-NEXT: addi 28, 28, 8 +; PWR8-NEXT: stfdu 1, 8(30) +; PWR8-NEXT: cmpldi 28, 32 +; PWR8-NEXT: bne 0, .LBB2_1 +; PWR8-NEXT: # %bb.2: # %for.end +; PWR8-NEXT: addi 1, 1, 64 +; PWR8-NEXT: ld 0, 16(1) +; PWR8-NEXT: ld 30, -16(1) # 8-byte Folded Reload +; PWR8-NEXT: ld 29, -24(1) # 8-byte Folded Reload +; PWR8-NEXT: ld 28, -32(1) # 8-byte Folded Reload +; PWR8-NEXT: mtlr 0 +; PWR8-NEXT: blr entry: br label %for.body @@ -67,9 +249,6 @@ for.body: for.end: ret void - -; CHECK-LABEL: fptrunc_ctrloop_fp128 -; CHECK-NOT: mtctr } declare void @obfuscate(ptr, ...) local_unnamed_addr #2 -- 2.7.4