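Fix for the following bug in AVX codegen for double-to-int conversions: fp_to_sint of a v4f64 operand was selected to VCVTPD2DQY, which rounds according to the current MXCSR rounding mode, instead of VCVTTPD2DQY, which truncates (rounds toward zero) as fptosi requires.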

author Victor Umansky <victor.umansky@intel.com>

Thu, 26 Jan 2012 08:51:39 +0000 (08:51 +0000)

committer Victor Umansky <victor.umansky@intel.com>

Thu, 26 Jan 2012 08:51:39 +0000 (08:51 +0000)
author Victor Umansky <victor.umansky@intel.com>
Thu, 26 Jan 2012 08:51:39 +0000 (08:51 +0000)
committer Victor Umansky <victor.umansky@intel.com>
Thu, 26 Jan 2012 08:51:39 +0000 (08:51 +0000)
diff --git a/lib/Target/X86/X86InstrSSE.td b/lib/Target/X86/X86InstrSSE.td

index 7b710f0928e1674a06faf9df593931143a5eacef..ac44473ca3c305ad6143ed07fbdea820801afcba 100644 (file)
--- a/lib/Target/X86/X86InstrSSE.td
+++ b/lib/Target/X86/X86InstrSSE.td
@@ -4693,9 +4693,9 @@ def CVTPD2DQrr  : S3DI<0xE6, MRMSrcReg, (outs VR128:$dst), (ins VR128:$src),
                         "cvtpd2dq\t{$src, $dst|$dst, $src}", []>;
  
  def : Pat<(v4i32 (fp_to_sint (v4f64 VR256:$src))),
-          (VCVTPD2DQYrr VR256:$src)>;
+          (VCVTTPD2DQYrr VR256:$src)>;
  def : Pat<(v4i32 (fp_to_sint (memopv4f64 addr:$src))),
-          (VCVTPD2DQYrm addr:$src)>;
+          (VCVTTPD2DQYrm addr:$src)>;
  
  // Convert Packed DW Integers to Packed Double FP
  let Predicates = [HasAVX] in {
diff --git a/test/CodeGen/X86/avx-cvt.ll b/test/CodeGen/X86/avx-cvt.ll

index 6c0bd58074d49ba8fd7017be32ea596f9656a073..d0a7fe01009e03fa959af2c173b20bf0fb1f84dd 100644 (file)
--- a/test/CodeGen/X86/avx-cvt.ll
+++ b/test/CodeGen/X86/avx-cvt.ll
@@ -18,7 +18,7 @@ define <4 x double> @sitofp01(<4 x i32> %a) {
    ret <4 x double> %b
  }
  
-; CHECK: vcvtpd2dqy %ymm
+; CHECK: vcvttpd2dqy %ymm
  define <4 x i32> @fptosi01(<4 x double> %a) {
    %b = fptosi <4 x double> %a to <4 x i32>
    ret <4 x i32> %b
diff --git a/test/CodeGen/X86/avx-fp2int.ll b/test/CodeGen/X86/avx-fp2int.ll

new file mode 100755 (executable)

index 0000000..9e505bd
--- /dev/null
+++ b/test/CodeGen/X86/avx-fp2int.ll
@@ -0,0 +1,19 @@
+; RUN: llc < %s -mtriple=i386-apple-darwin10 -mcpu=corei7-avx -mattr=+avx | FileCheck %s\r
+\r
+;; Check that FP_TO_SINT and FP_TO_UINT generate convert with truncate\r
+\r
+; CHECK: test1:\r
+; CHECK: vcvttpd2dqy\r
+; CHECK: ret\r
+; CHECK: test2:\r
+; CHECK: vcvttpd2dqy\r
+; CHECK: ret\r
+\r
+define <4 x i8> @test1(<4 x double> %d) {\r
+  %c = fptoui <4 x double> %d to <4 x i8>\r
+  ret <4 x i8> %c\r
+}\r
+define <4 x i8> @test2(<4 x double> %d) {\r
+  %c = fptosi <4 x double> %d to <4 x i8>\r
+  ret <4 x i8> %c\r
+}\r
author	Victor Umansky <victor.umansky@intel.com>
	Thu, 26 Jan 2012 08:51:39 +0000 (08:51 +0000)
committer	Victor Umansky <victor.umansky@intel.com>
	Thu, 26 Jan 2012 08:51:39 +0000 (08:51 +0000)
lib/Target/X86/X86InstrSSE.td		patch | blob | history
test/CodeGen/X86/avx-cvt.ll		patch | blob | history
test/CodeGen/X86/avx-fp2int.ll	[new file with mode: 0755]	patch | blob