Fix PR7162: Use source register classes and sub-indices to determine the correct...

author Evan Cheng <evan.cheng@apple.com>

Tue, 18 May 2010 20:03:28 +0000 (20:03 +0000)

committer Evan Cheng <evan.cheng@apple.com>

Tue, 18 May 2010 20:03:28 +0000 (20:03 +0000)
author Evan Cheng <evan.cheng@apple.com>
Tue, 18 May 2010 20:03:28 +0000 (20:03 +0000)
committer Evan Cheng <evan.cheng@apple.com>
Tue, 18 May 2010 20:03:28 +0000 (20:03 +0000)
diff --git a/lib/CodeGen/SelectionDAG/InstrEmitter.cpp b/lib/CodeGen/SelectionDAG/InstrEmitter.cpp

index 16bd40ca65a797e14ef0ccefaf7ed46700356cac..2f8f255b5b55fd6eac51aef223a7d99010ec00f3 100644 (file)
--- a/lib/CodeGen/SelectionDAG/InstrEmitter.cpp
+++ b/lib/CodeGen/SelectionDAG/InstrEmitter.cpp
@@ -545,16 +545,18 @@ void InstrEmitter::EmitRegSequence(SDNode *Node,
    const TargetInstrDesc &II = TII->get(TargetOpcode::REG_SEQUENCE);
    for (unsigned i = 0; i != NumOps; ++i) {
      SDValue Op = Node->getOperand(i);
-#ifndef NDEBUG
      if (i & 1) {
        unsigned SubIdx = cast<ConstantSDNode>(Op)->getZExtValue();
        unsigned SubReg = getVR(Node->getOperand(i-1), VRBaseMap);
        const TargetRegisterClass *TRC = MRI->getRegClass(SubReg);
        const TargetRegisterClass *SRC =
-        getSuperRegisterRegClass(TRC, SubIdx, Node->getValueType(0));
-      assert(SRC == RC && "Invalid subregister index in REG_SEQUENCE");
+        TRI->getMatchingSuperRegClass(RC, TRC, SubIdx);
+      //getSuperRegisterRegClass(TRC, SubIdx, Node->getValueType(0));
+      if (!SRC)
+        llvm_unreachable("Invalid subregister index in REG_SEQUENCE");
+      if (SRC != RC)
+        MRI->setRegClass(NewVReg, SRC);
      }
-#endif
      AddOperand(MI, Op, i+1, &II, VRBaseMap, /*IsDebug=*/false,
                 IsClone, IsCloned);
    }
diff --git a/test/CodeGen/ARM/reg_sequence.ll b/test/CodeGen/ARM/reg_sequence.ll

index f74f8da08640663245a4a389e7c84ba4e3f5973a..540bfcabfeafc1771eae432e2de06b45b15546bf 100644 (file)
--- a/test/CodeGen/ARM/reg_sequence.ll
+++ b/test/CodeGen/ARM/reg_sequence.ll
@@ -264,6 +264,44 @@ define arm_aapcs_vfpcc float @t9(%0* nocapture, %3* nocapture) nounwind {
    ret float 9.990000e+02
  }
  
+; PR7162
+define arm_aapcs_vfpcc i32 @t10() nounwind {
+entry:
+; CHECK: t10:
+; CHECK: vmov.i32 q1, #0x3F000000
+; CHECK: vdup.32 q0, d0[0]
+; CHECK: vmov d0, d1
+; CHECK: vmla.f32 q0, q0, d0[0]
+  %0 = shufflevector <4 x float> zeroinitializer, <4 x float> undef, <4 x i32> zeroinitializer ; <<4 x float>> [#uses=1]
+  %1 = insertelement <4 x float> %0, float undef, i32 1 ; <<4 x float>> [#uses=1]
+  %2 = insertelement <4 x float> %1, float undef, i32 2 ; <<4 x float>> [#uses=1]
+  %3 = insertelement <4 x float> %2, float undef, i32 3 ; <<4 x float>> [#uses=1]
+  %tmp54.i = bitcast <4 x float> %3 to <2 x double> ; <<2 x double>> [#uses=1]
+  %4 = extractelement <2 x double> %tmp54.i, i32 1 ; <double> [#uses=1]
+  %5 = bitcast double %4 to <2 x float>           ; <<2 x float>> [#uses=1]
+  %6 = shufflevector <2 x float> %5, <2 x float> undef, <4 x i32> zeroinitializer ; <<4 x float>> [#uses=1]
+  %7 = fmul <4 x float> undef, %6                 ; <<4 x float>> [#uses=1]
+  %8 = fadd <4 x float> %7, undef                 ; <<4 x float>> [#uses=1]
+  %9 = fadd <4 x float> %8, undef                 ; <<4 x float>> [#uses=1]
+  %10 = shufflevector <4 x float> undef, <4 x float> %9, <4 x i32> <i32 0, i32 1, i32 2, i32 7> ; <<4 x float>> [#uses=1]
+  %11 = fmul <4 x float> %10, <float 5.000000e-01, float 5.000000e-01, float 5.000000e-01, float 5.000000e-01> ; <<4 x float>> [#uses=1]
+  %12 = shufflevector <4 x float> %11, <4 x float> undef, <4 x i32> <i32 3, i32 undef, i32 undef, i32 undef> ; <<4 x float>> [#uses=1]
+  %13 = shufflevector <4 x float> %12, <4 x float> undef, <4 x i32> zeroinitializer ; <<4 x float>> [#uses=1]
+  %14 = fmul <4 x float> %13, undef               ; <<4 x float>> [#uses=1]
+  %15 = fadd <4 x float> undef, %14               ; <<4 x float>> [#uses=1]
+  %16 = shufflevector <4 x float> undef, <4 x float> %15, <4 x i32> <i32 0, i32 1, i32 6, i32 3> ; <<4 x float>> [#uses=1]
+  %17 = fmul <4 x float> %16, undef               ; <<4 x float>> [#uses=1]
+  %18 = extractelement <4 x float> %17, i32 2     ; <float> [#uses=1]
+  store float %18, float* undef, align 4
+  br i1 undef, label %exit, label %bb14
+
+exit:          ; preds = %bb.i19
+  unreachable
+
+bb14:                                             ; preds = %bb6
+  ret i32 0
+}
+
  declare <4 x i32> @llvm.arm.neon.vld1.v4i32(i8*) nounwind readonly
  
  declare <8 x i16> @llvm.arm.neon.vld1.v8i16(i8*) nounwind readonly
author	Evan Cheng <evan.cheng@apple.com>
	Tue, 18 May 2010 20:03:28 +0000 (20:03 +0000)
committer	Evan Cheng <evan.cheng@apple.com>
	Tue, 18 May 2010 20:03:28 +0000 (20:03 +0000)
lib/CodeGen/SelectionDAG/InstrEmitter.cpp		patch \| blob \| history
test/CodeGen/ARM/reg_sequence.ll		patch \| blob \| history