From c310bfa19397e15903a8f5386b51366aade414b9 Mon Sep 17 00:00:00 2001 From: Simon Pilgrim Date: Wed, 18 Apr 2018 20:47:48 +0000 Subject: [PATCH] [llvm-mca][X86] Add mmx versions of SSSE3 instructions Move PABS instructions incorrectly tested under SSE2 llvm-svn: 330295 --- .../tools/llvm-mca/X86/BtVer2/resources-sse2.s | 23 +--- .../tools/llvm-mca/X86/BtVer2/resources-ssse3.s | 135 ++++++++++++++++++++- 2 files changed, 135 insertions(+), 23 deletions(-) diff --git a/llvm/test/tools/llvm-mca/X86/BtVer2/resources-sse2.s b/llvm/test/tools/llvm-mca/X86/BtVer2/resources-sse2.s index ef9a842..4a3b22c 100644 --- a/llvm/test/tools/llvm-mca/X86/BtVer2/resources-sse2.s +++ b/llvm/test/tools/llvm-mca/X86/BtVer2/resources-sse2.s @@ -144,15 +144,6 @@ mulsd (%rax), %xmm2 orpd %xmm0, %xmm2 orpd (%rax), %xmm2 -pabsb %xmm0, %xmm2 -pabsb (%rax), %xmm2 - -pabsd %xmm0, %xmm2 -pabsd (%rax), %xmm2 - -pabsw %xmm0, %xmm2 -pabsw (%rax), %xmm2 - packssdw %xmm0, %xmm2 packssdw (%rax), %xmm2 @@ -483,12 +474,6 @@ xorpd (%rax), %xmm2 # CHECK-NEXT: 1 9 2.00 * mulsd (%rax), %xmm2 # CHECK-NEXT: 1 1 0.50 orpd %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * orpd (%rax), %xmm2 -# CHECK-NEXT: 1 1 0.50 pabsb %xmm0, %xmm2 -# CHECK-NEXT: 1 6 1.00 * pabsb (%rax), %xmm2 -# CHECK-NEXT: 1 1 0.50 pabsd %xmm0, %xmm2 -# CHECK-NEXT: 1 6 1.00 * pabsd (%rax), %xmm2 -# CHECK-NEXT: 1 1 0.50 pabsw %xmm0, %xmm2 -# CHECK-NEXT: 1 6 1.00 * pabsw (%rax), %xmm2 # CHECK-NEXT: 1 1 0.50 packssdw %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * packssdw (%rax), %xmm2 # CHECK-NEXT: 1 1 0.50 packsswb %xmm0, %xmm2 @@ -658,7 +643,7 @@ xorpd (%rax), %xmm2 # CHECK: Resource pressure per iteration: # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12] [13] -# CHECK-NEXT: 17.00 2.00 - 47.50 202.50 115.00 127.00 114.00 - 12.00 43.00 65.50 65.50 10.00 +# CHECK-NEXT: 17.00 2.00 - 47.50 202.50 112.00 124.00 111.00 - 12.00 43.00 62.50 62.50 10.00 # CHECK: Resource pressure by instruction: # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12] [13] Instructions: @@ -760,12 +745,6 @@ xorpd (%rax), %xmm2 # CHECK-NEXT: - - - - 2.00 - 1.00 1.00 - - - - - - mulsd (%rax), %xmm2 # CHECK-NEXT: - - - 0.50 0.50 0.50 0.50 - - - - - - - orpd %xmm0, %xmm2 # CHECK-NEXT: - - - 0.50 0.50 0.50 0.50 1.00 - - - - - - orpd (%rax), %xmm2 -# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsb %xmm0, %xmm2 -# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsb (%rax), %xmm2 -# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsd %xmm0, %xmm2 -# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsd (%rax), %xmm2 -# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsw %xmm0, %xmm2 -# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsw (%rax), %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - packssdw %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - packssdw (%rax), %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - packsswb %xmm0, %xmm2 diff --git a/llvm/test/tools/llvm-mca/X86/BtVer2/resources-ssse3.s b/llvm/test/tools/llvm-mca/X86/BtVer2/resources-ssse3.s index 13d2b3c..667e809 100644 --- a/llvm/test/tools/llvm-mca/X86/BtVer2/resources-ssse3.s +++ b/llvm/test/tools/llvm-mca/X86/BtVer2/resources-ssse3.s @@ -1,42 +1,99 @@ # NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py # RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=btver2 -instruction-tables < %s | FileCheck %s +pabsb %mm0, %mm2 +pabsb (%rax), %mm2 + +pabsb %xmm0, %xmm2 +pabsb (%rax), %xmm2 + +pabsd %mm0, %mm2 +pabsd (%rax), %mm2 + +pabsd %xmm0, %xmm2 +pabsd (%rax), %xmm2 + +pabsw %mm0, %mm2 +pabsw (%rax), %mm2 + +pabsw %xmm0, %xmm2 +pabsw (%rax), %xmm2 + +palignr $1, %mm0, %mm2 +palignr $1, (%rax), %mm2 + palignr $1, %xmm0, %xmm2 palignr $1, (%rax), %xmm2 +phaddd %mm0, %mm2 +phaddd (%rax), %mm2 + phaddd %xmm0, %xmm2 phaddd (%rax), %xmm2 +phaddsw %mm0, %mm2 +phaddsw (%rax), %mm2 + phaddsw %xmm0, %xmm2 phaddsw (%rax), %xmm2 +phaddw %mm0, %mm2 +phaddw (%rax), %mm2 + phaddw %xmm0, %xmm2 phaddw (%rax), %xmm2 +phsubd %mm0, %mm2 +phsubd (%rax), %mm2 + phsubd %xmm0, %xmm2 phsubd (%rax), %xmm2 +phsubsw %mm0, %mm2 +phsubsw (%rax), %mm2 + phsubsw %xmm0, %xmm2 phsubsw (%rax), %xmm2 +phsubw %mm0, %mm2 +phsubw (%rax), %mm2 + phsubw %xmm0, %xmm2 phsubw (%rax), %xmm2 +pmaddubsw %mm0, %mm2 +pmaddubsw (%rax), %mm2 + pmaddubsw %xmm0, %xmm2 pmaddubsw (%rax), %xmm2 +pmulhrsw %mm0, %mm2 +pmulhrsw (%rax), %mm2 + pmulhrsw %xmm0, %xmm2 pmulhrsw (%rax), %xmm2 +pshufb %mm0, %mm2 +pshufb (%rax), %mm2 + pshufb %xmm0, %xmm2 pshufb (%rax), %xmm2 +psignb %mm0, %mm2 +psignb (%rax), %mm2 + psignb %xmm0, %xmm2 psignb (%rax), %xmm2 +psignd %mm0, %mm2 +psignd (%rax), %mm2 + psignd %xmm0, %xmm2 psignd (%rax), %xmm2 +psignw %mm0, %mm2 +psignw (%rax), %mm2 + psignw %xmm0, %xmm2 psignw (%rax), %xmm2 @@ -49,30 +106,68 @@ psignw (%rax), %xmm2 # CHECK-NEXT: [6]: HasSideEffects # CHECK: [1] [2] [3] [4] [5] [6] Instructions: +# CHECK-NEXT: 1 1 0.50 pabsb %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * pabsb (%rax), %mm2 +# CHECK-NEXT: 1 1 0.50 pabsb %xmm0, %xmm2 +# CHECK-NEXT: 1 6 1.00 * pabsb (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 pabsd %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * pabsd (%rax), %mm2 +# CHECK-NEXT: 1 1 0.50 pabsd %xmm0, %xmm2 +# CHECK-NEXT: 1 6 1.00 * pabsd (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 pabsw %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * pabsw (%rax), %mm2 +# CHECK-NEXT: 1 1 0.50 pabsw %xmm0, %xmm2 +# CHECK-NEXT: 1 6 1.00 * pabsw (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 palignr $1, %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * palignr $1, (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 palignr $1, %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * palignr $1, (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 phaddd %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * phaddd (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 phaddd %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * phaddd (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 phaddsw %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * phaddsw (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 phaddsw %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * phaddsw (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 phaddw %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * phaddw (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 phaddw %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * phaddw (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 phsubd %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * phsubd (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 phsubd %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * phsubd (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 phsubsw %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * phsubsw (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 phsubsw %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * phsubsw (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 phsubw %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * phsubw (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 phsubw %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * phsubw (%rax), %xmm2 +# CHECK-NEXT: 1 2 1.00 pmaddubsw %mm0, %mm2 +# CHECK-NEXT: 1 7 1.00 * pmaddubsw (%rax), %mm2 # CHECK-NEXT: 1 2 1.00 pmaddubsw %xmm0, %xmm2 # CHECK-NEXT: 1 7 1.00 * pmaddubsw (%rax), %xmm2 +# CHECK-NEXT: 1 2 1.00 pmulhrsw %mm0, %mm2 +# CHECK-NEXT: 1 7 1.00 * pmulhrsw (%rax), %mm2 # CHECK-NEXT: 1 2 1.00 pmulhrsw %xmm0, %xmm2 # CHECK-NEXT: 1 7 1.00 * pmulhrsw (%rax), %xmm2 +# CHECK-NEXT: 3 2 2.00 pshufb %mm0, %mm2 +# CHECK-NEXT: 3 7 2.00 * pshufb (%rax), %mm2 # CHECK-NEXT: 3 2 2.00 pshufb %xmm0, %xmm2 # CHECK-NEXT: 3 7 2.00 * pshufb (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 psignb %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * psignb (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 psignb %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * psignb (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 psignd %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * psignd (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 psignd %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * psignd (%rax), %xmm2 +# CHECK-NEXT: 1 1 0.50 psignw %mm0, %mm2 +# CHECK-NEXT: 1 6 1.00 * psignw (%rax), %mm2 # CHECK-NEXT: 1 1 0.50 psignw %xmm0, %xmm2 # CHECK-NEXT: 1 6 1.00 * psignw (%rax), %xmm2 @@ -94,34 +189,72 @@ psignw (%rax), %xmm2 # CHECK: Resource pressure per iteration: # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12] [13] -# CHECK-NEXT: - - - - - 15.00 11.00 13.00 - - - 14.00 14.00 4.00 +# CHECK-NEXT: - - - - - 36.00 28.00 32.00 - - - 34.00 34.00 8.00 # CHECK: Resource pressure by instruction: # CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] [12] [13] Instructions: +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsb %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsb (%rax), %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsb %xmm0, %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsb (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsd %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsd (%rax), %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsd %xmm0, %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsd (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsw %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsw (%rax), %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - pabsw %xmm0, %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - pabsw (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - palignr $1, %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - palignr $1, (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - palignr $1, %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - palignr $1, (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phaddd %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phaddd (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phaddd %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phaddd (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phaddsw %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phaddsw (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phaddsw %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phaddsw (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phaddw %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phaddw (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phaddw %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phaddw (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phsubd %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phsubd (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phsubd %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phsubd (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phsubsw %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phsubsw (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phsubsw %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phsubsw (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phsubw %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phsubw (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - phsubw %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - phsubw (%rax), %xmm2 +# CHECK-NEXT: - - - - - 1.00 - - - - - - - 1.00 pmaddubsw %mm0, %mm2 +# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - - 1.00 pmaddubsw (%rax), %mm2 # CHECK-NEXT: - - - - - 1.00 - - - - - - - 1.00 pmaddubsw %xmm0, %xmm2 # CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - - 1.00 pmaddubsw (%rax), %xmm2 +# CHECK-NEXT: - - - - - 1.00 - - - - - - - 1.00 pmulhrsw %mm0, %mm2 +# CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - - 1.00 pmulhrsw (%rax), %mm2 # CHECK-NEXT: - - - - - 1.00 - - - - - - - 1.00 pmulhrsw %xmm0, %xmm2 # CHECK-NEXT: - - - - - 1.00 - 1.00 - - - - - 1.00 pmulhrsw (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 2.00 2.00 - pshufb %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 2.00 2.00 - pshufb (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 2.00 2.00 - pshufb %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 2.00 2.00 - pshufb (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - psignb %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - psignb (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - psignb %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - psignb (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - psignd %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - psignd (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - psignd %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - psignd (%rax), %xmm2 +# CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - psignw %mm0, %mm2 +# CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - psignw (%rax), %mm2 # CHECK-NEXT: - - - - - 0.50 0.50 - - - - 0.50 0.50 - psignw %xmm0, %xmm2 # CHECK-NEXT: - - - - - 0.50 0.50 1.00 - - - 0.50 0.50 - psignw (%rax), %xmm2 -- 2.7.4