[X86][FastISel] Don't force Nearest-Even rounding for VCVTPS2PH, use MXCSR.

author Ahmed Bougacha <ahmed.bougacha@gmail.com>

Tue, 2 Feb 2016 01:44:03 +0000 (01:44 +0000)

committer Ahmed Bougacha <ahmed.bougacha@gmail.com>

Tue, 2 Feb 2016 01:44:03 +0000 (01:44 +0000)
author Ahmed Bougacha <ahmed.bougacha@gmail.com>
Tue, 2 Feb 2016 01:44:03 +0000 (01:44 +0000)
committer Ahmed Bougacha <ahmed.bougacha@gmail.com>
Tue, 2 Feb 2016 01:44:03 +0000 (01:44 +0000)
diff --git a/llvm/lib/Target/X86/X86FastISel.cpp b/llvm/lib/Target/X86/X86FastISel.cpp

index f48b479..854a4e7 100644 (file)
--- a/llvm/lib/Target/X86/X86FastISel.cpp
+++ b/llvm/lib/Target/X86/X86FastISel.cpp
@@ -2294,8 +2294,10 @@ bool X86FastISel::fastLowerIntrinsicCall(const IntrinsicInst *II) {
        // register class VR128 by method 'constrainOperandRegClass' which is
        // directly called by 'fastEmitInst_ri'.
        // Instruction VCVTPS2PHrr takes an extra immediate operand which is
-      // used to provide rounding control.
-      InputReg = fastEmitInst_ri(X86::VCVTPS2PHrr, RC, InputReg, false, 0);
+      // used to provide rounding control: use MXCSR.RC, encoded as 0b100.
+      // It's consistent with the other FP instructions, which are usually
+      // controlled by MXCSR.
+      InputReg = fastEmitInst_ri(X86::VCVTPS2PHrr, RC, InputReg, false, 4);
  
        // Move the lower 32-bits of ResultReg to another register of class GR32.
        ResultReg = createResultReg(&X86::GR32RegClass);
diff --git a/llvm/test/CodeGen/X86/fast-isel-float-half-convertion.ll b/llvm/test/CodeGen/X86/fast-isel-float-half-convertion.ll

index 707a325..acb85fd 100644 (file)
--- a/llvm/test/CodeGen/X86/fast-isel-float-half-convertion.ll
+++ b/llvm/test/CodeGen/X86/fast-isel-float-half-convertion.ll
@@ -4,7 +4,7 @@
  
  define i16 @test_fp32_to_fp16(float %a) {
  ; CHECK-LABEL: test_fp32_to_fp16:
-; CHECK: vcvtps2ph $0, %xmm0, %xmm0
+; CHECK: vcvtps2ph $4, %xmm0, %xmm0
  ; CHECK-NEXT: vmovd %xmm0, %eax
  ; CHECK-NEXT: retq
  entry:
author	Ahmed Bougacha <ahmed.bougacha@gmail.com>
	Tue, 2 Feb 2016 01:44:03 +0000 (01:44 +0000)
committer	Ahmed Bougacha <ahmed.bougacha@gmail.com>
	Tue, 2 Feb 2016 01:44:03 +0000 (01:44 +0000)
llvm/lib/Target/X86/X86FastISel.cpp		patch | blob | history
llvm/test/CodeGen/X86/fast-isel-float-half-convertion.ll		patch | blob | history