[X86] Add initialization of FPCW in llvm-exegesis
author: Wang, Pengfei <pengfei.wang@intel.com>
Mon, 2 Dec 2019 11:39:16 +0000 (19:39 +0800)
committer: Wang, Pengfei <pengfei.wang@intel.com>
Mon, 2 Dec 2019 12:18:35 +0000 (20:18 +0800)
Summary: This is a follow-up to D70874. It adds the initialization of FPCW in llvm-exegesis.

Reviewers: craig.topper, RKSimon, courbet, gchatelet

Subscribers: tschuett, llvm-commits

Tags: #llvm

Differential Revision: https://reviews.llvm.org/D70891

llvm/test/tools/llvm-exegesis/X86/uops-ADD_F32m.s [new file with mode: 0644]
llvm/tools/llvm-exegesis/lib/X86/Target.cpp

diff --git a/llvm/test/tools/llvm-exegesis/X86/uops-ADD_F32m.s b/llvm/test/tools/llvm-exegesis/X86/uops-ADD_F32m.s
new file mode 100644 (file)
index 0000000..023fa78
--- /dev/null
@@ -0,0 +1,9 @@
+# RUN: llvm-exegesis -mode=uops -opcode-name=ADD_F32m -repetition-mode=duplicate | FileCheck %s
+# RUN: llvm-exegesis -mode=uops -opcode-name=ADD_F32m -repetition-mode=loop | FileCheck %s
+
+CHECK:      mode:            uops
+CHECK-NEXT: key:
+CHECK-NEXT:   instructions:
+CHECK-NEXT:     ADD_F32m
+CHECK:      register_initial_values:
+CHECK:      FPCW
index 974b2c9..08724dd 100644 (file)
@@ -439,7 +439,8 @@ struct ConstantInliner {
 
   std::vector<MCInst> popFlagAndFinalize();
 
-  std::vector<MCInst> loadMXCSRAndFinalize(bool HasAVX);
+  std::vector<MCInst> loadImplicitRegAndFinalize(unsigned Opcode,
+                                                 unsigned Value);
 
 private:
   ConstantInliner &add(const MCInst &Inst) {
@@ -501,10 +502,11 @@ std::vector<MCInst> ConstantInliner::popFlagAndFinalize() {
   return std::move(Instructions);
 }
 
-std::vector<MCInst> ConstantInliner::loadMXCSRAndFinalize(bool HasAVX) {
+std::vector<MCInst>
+ConstantInliner::loadImplicitRegAndFinalize(unsigned Opcode, unsigned Value) {
   add(allocateStackSpace(4));
-  add(fillStackSpace(X86::MOV32mi, 0, 0x1f80)); // Mask all FP exceptions
-  add(MCInstBuilder(HasAVX ? X86::VLDMXCSR : X86::LDMXCSR)
+  add(fillStackSpace(X86::MOV32mi, 0, Value)); // Mask all FP exceptions
+  add(MCInstBuilder(Opcode)
           // Address = ESP
           .addReg(X86::RSP) // BaseReg
           .addImm(1)        // ScaleAmt
@@ -715,7 +717,11 @@ std::vector<MCInst> ExegesisX86Target::setRegTo(const MCSubtargetInfo &STI,
   if (Reg == X86::EFLAGS)
     return CI.popFlagAndFinalize();
   if (Reg == X86::MXCSR)
-    return CI.loadMXCSRAndFinalize(STI.getFeatureBits()[X86::FeatureAVX]);
+    return CI.loadImplicitRegAndFinalize(
+              STI.getFeatureBits()[X86::FeatureAVX] ? X86::VLDMXCSR
+                                                    : X86::LDMXCSR, 0x1f80);
+  if (Reg == X86::FPCW)
+    return CI.loadImplicitRegAndFinalize(X86::FLDCW16m, 0x37f);
   return {}; // Not yet implemented.
 }