Fix VINSERTF128/VEXTRACTF128 to be marked as FP instructions. Allow execution depende...

author Craig Topper <craig.topper@gmail.com>

Tue, 29 Nov 2011 05:37:58 +0000 (05:37 +0000)

committer Craig Topper <craig.topper@gmail.com>

Tue, 29 Nov 2011 05:37:58 +0000 (05:37 +0000)
author Craig Topper <craig.topper@gmail.com>
Tue, 29 Nov 2011 05:37:58 +0000 (05:37 +0000)
committer Craig Topper <craig.topper@gmail.com>
Tue, 29 Nov 2011 05:37:58 +0000 (05:37 +0000)
diff --git a/lib/Target/X86/X86InstrInfo.cpp b/lib/Target/X86/X86InstrInfo.cpp

index 5d310af3eb6d582f738c23d670644ee71acbb03a..b28f9c1e7c199b966b8469a4c46d0d7156985598 100644 (file)
--- a/lib/Target/X86/X86InstrInfo.cpp
+++ b/lib/Target/X86/X86InstrInfo.cpp
@@ -3568,10 +3568,14 @@ static const unsigned ReplaceableInstrsAVX2[][3] = {
    { X86::VANDPSYrr,    X86::VANDPDYrr,    X86::VPANDYrr    },
    { X86::VORPSYrm,     X86::VORPDYrm,     X86::VPORYrm     },
    { X86::VORPSYrr,     X86::VORPDYrr,     X86::VPORYrr     },
-  { X86::VPERM2F128rm, X86::VPERM2F128rm, X86::VPERM2I128rm },
-  { X86::VPERM2F128rr, X86::VPERM2F128rr, X86::VPERM2I128rr },
    { X86::VXORPSYrm,    X86::VXORPDYrm,    X86::VPXORYrm    },
-  { X86::VXORPSYrr,    X86::VXORPDYrr,    X86::VPXORYrr    }
+  { X86::VXORPSYrr,    X86::VXORPDYrr,    X86::VPXORYrr    },
+  { X86::VEXTRACTF128mr, X86::VEXTRACTF128mr, X86::VEXTRACTI128mr },
+  { X86::VEXTRACTF128rr, X86::VEXTRACTF128rr, X86::VEXTRACTI128rr },
+  { X86::VINSERTF128rm,  X86::VINSERTF128rm,  X86::VINSERTI128rm },
+  { X86::VINSERTF128rr,  X86::VINSERTF128rr,  X86::VINSERTI128rr },
+  { X86::VPERM2F128rm,   X86::VPERM2F128rm,   X86::VPERM2I128rm },
+  { X86::VPERM2F128rr,   X86::VPERM2F128rr,   X86::VPERM2I128rr }
  };
  
  // FIXME: Some shuffle and unpack instructions have equivalents in different
diff --git a/lib/Target/X86/X86InstrSSE.td b/lib/Target/X86/X86InstrSSE.td

index 0be59ccd87bcada0059b2b3d9fae4a620bdd5433..1d8e3ce284d9e125cd50477e618d7dbd4687c4be 100644 (file)
--- a/lib/Target/X86/X86InstrSSE.td
+++ b/lib/Target/X86/X86InstrSSE.td
@@ -7147,7 +7147,7 @@ def : Pat<(int_x86_avx_vbroadcastf128_ps_256 addr:$src),
  //===----------------------------------------------------------------------===//
  // VINSERTF128 - Insert packed floating-point values
  //
-let neverHasSideEffects = 1 in {
+let neverHasSideEffects = 1, ExeDomain = SSEPackedSingle in {
  def VINSERTF128rr : AVXAIi8<0x18, MRMSrcReg, (outs VR256:$dst),
            (ins VR256:$src1, VR128:$src2, i8imm:$src3),
            "vinsertf128\t{$src3, $src2, $src1, $dst|$dst, $src1, $src2, $src3}",
@@ -7194,7 +7194,7 @@ def : Pat<(vinsertf128_insert:$ins (v16i16 VR256:$src1), (v8i16 VR128:$src2),
  //===----------------------------------------------------------------------===//
  // VEXTRACTF128 - Extract packed floating-point values
  //
-let neverHasSideEffects = 1 in {
+let neverHasSideEffects = 1, ExeDomain = SSEPackedSingle in {
  def VEXTRACTF128rr : AVXAIi8<0x19, MRMDestReg, (outs VR128:$dst),
            (ins VR256:$src1, i8imm:$src2),
            "vextractf128\t{$src2, $src1, $dst|$dst, $src1, $src2}",
diff --git a/test/CodeGen/X86/avx-cast.ll b/test/CodeGen/X86/avx-cast.ll

index d6d2415ea0593f735e1859ae373133d7f5cdacb4..32d450cac9f9afd92c242fdff28ab60476896390 100644 (file)
--- a/test/CodeGen/X86/avx-cast.ll
+++ b/test/CodeGen/X86/avx-cast.ll
@@ -16,7 +16,7 @@ entry:
    ret <4 x double> %shuffle.i
  }
  
-; CHECK: vpxor
+; CHECK: vxorps
  ; CHECK-NEXT: vinsertf128 $0
  define <4 x i64> @castC(<2 x i64> %m) nounwind uwtable readnone ssp {
  entry:
diff --git a/test/CodeGen/X86/avx-intrinsics-x86.ll b/test/CodeGen/X86/avx-intrinsics-x86.ll

index 57e73121549dde3d5df03557e254898d13cc48c9..eccc842406a2e9db17eade213337852b0bb513fa 100644 (file)
--- a/test/CodeGen/X86/avx-intrinsics-x86.ll
+++ b/test/CodeGen/X86/avx-intrinsics-x86.ll
@@ -2140,7 +2140,8 @@ declare <8 x float> @llvm.x86.avx.sqrt.ps.256(<8 x float>) nounwind readnone
  
  
  define void @test_x86_avx_storeu_dq_256(i8* %a0, <32 x i8> %a1) {
-  ; CHECK: vmovdqu
+  ; FIXME: unfortunately the execution domain fix pass changes this to vmovups and its hard to force with no 256-bit integer instructions
+  ; CHECK: vmovups
    ; add operation forces the execution domain.
    %a2 = add <32 x i8> %a1, <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>
    call void @llvm.x86.avx.storeu.dq.256(i8* %a0, <32 x i8> %a2)
diff --git a/test/CodeGen/X86/avx-splat.ll b/test/CodeGen/X86/avx-splat.ll

index af20b90322e173b567e36a5cfa2018c95f61d4aa..f8522c269515d3ebb3746f811cefb12a6e37241a 100644 (file)
--- a/test/CodeGen/X86/avx-splat.ll
+++ b/test/CodeGen/X86/avx-splat.ll
@@ -47,7 +47,7 @@ entry:
  ;   shuffle (scalar_to_vector (load (ptr + 4))), undef, <0, 0, 0, 0>
  ; To:
  ;   shuffle (vload ptr)), undef, <1, 1, 1, 1>
-; CHECK: vmovdqa
+; CHECK: vmovaps
  ; CHECK-NEXT: vinsertf128  $1
  ; CHECK-NEXT: vpermilps $-1
  define <8 x float> @funcE() nounwind {
diff --git a/test/CodeGen/X86/avx2-intrinsics-x86.ll b/test/CodeGen/X86/avx2-intrinsics-x86.ll

index bab7fb81e537f9490d4f0c7455f6ce2530974adc..a0f351de76086896d8a2a589472d4862193622e1 100644 (file)
--- a/test/CodeGen/X86/avx2-intrinsics-x86.ll
+++ b/test/CodeGen/X86/avx2-intrinsics-x86.ll
@@ -1046,3 +1046,13 @@ define <8 x i32> @test_x86_avx2_psrav_d_256(<8 x i32> %a0, <8 x i32> %a1) {
    ret <8 x i32> %res
  }
  declare <8 x i32> @llvm.x86.avx2.psrav.d.256(<8 x i32>, <8 x i32>) nounwind readnone
+
+; This is checked here because the execution dependency fix pass makes it hard to test in AVX mode since we don't have 256-bit integer instructions
+define void @test_x86_avx_storeu_dq_256(i8* %a0, <32 x i8> %a1) {
+  ; CHECK: vmovdqu
+  ; add operation forces the execution domain.
+  %a2 = add <32 x i8> %a1, <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>
+  call void @llvm.x86.avx.storeu.dq.256(i8* %a0, <32 x i8> %a2)
+  ret void
+}
+declare void @llvm.x86.avx.storeu.dq.256(i8*, <32 x i8>) nounwind
author	Craig Topper <craig.topper@gmail.com>
	Tue, 29 Nov 2011 05:37:58 +0000 (05:37 +0000)
committer	Craig Topper <craig.topper@gmail.com>
	Tue, 29 Nov 2011 05:37:58 +0000 (05:37 +0000)
lib/Target/X86/X86InstrInfo.cpp		patch \| blob \| history
lib/Target/X86/X86InstrSSE.td		patch \| blob \| history
test/CodeGen/X86/avx-cast.ll		patch \| blob \| history
test/CodeGen/X86/avx-intrinsics-x86.ll		patch \| blob \| history
test/CodeGen/X86/avx-splat.ll		patch \| blob \| history
test/CodeGen/X86/avx2-intrinsics-x86.ll		patch \| blob \| history