Allocate virtual registers in ascending order.

author Jakob Stoklund Olesen <stoklund@2pi.dk>

Mon, 2 Apr 2012 22:30:39 +0000 (22:30 +0000)

committer Jakob Stoklund Olesen <stoklund@2pi.dk>

Mon, 2 Apr 2012 22:30:39 +0000 (22:30 +0000)
author Jakob Stoklund Olesen <stoklund@2pi.dk>
Mon, 2 Apr 2012 22:30:39 +0000 (22:30 +0000)
committer Jakob Stoklund Olesen <stoklund@2pi.dk>
Mon, 2 Apr 2012 22:30:39 +0000 (22:30 +0000)
diff --git a/lib/CodeGen/RegAllocGreedy.cpp b/lib/CodeGen/RegAllocGreedy.cpp

index f29a85287ba0fbfc3b6ffb6ca2695b2e7f9a64b3..d00259a6d91c07159886832ffe54fde5c7941094 100644 (file)
--- a/lib/CodeGen/RegAllocGreedy.cpp
+++ b/lib/CodeGen/RegAllocGreedy.cpp
@@ -428,13 +428,13 @@ void RAGreedy::enqueue(LiveInterval *LI) {
        Prio |= (1u << 30);
    }
  
-  Queue.push(std::make_pair(Prio, Reg));
+  Queue.push(std::make_pair(Prio, ~Reg));
  }
  
  LiveInterval *RAGreedy::dequeue() {
    if (Queue.empty())
      return 0;
-  LiveInterval *LI = &LIS->getInterval(Queue.top().second);
+  LiveInterval *LI = &LIS->getInterval(~Queue.top().second);
    Queue.pop();
    return LI;
  }
diff --git a/test/CodeGen/ARM/ldrd.ll b/test/CodeGen/ARM/ldrd.ll

index a588bc31535053bb0624a3d02d989186357bcacf..3f8fd75f49f943b1c7bb5157e6f57164eb113dfe 100644 (file)
--- a/test/CodeGen/ARM/ldrd.ll
+++ b/test/CodeGen/ARM/ldrd.ll
@@ -44,8 +44,7 @@ entry:
  ; BASIC: str
  ; GREEDY: @f
  ; GREEDY: %bb
-; GREEDY: ldr
-; GREEDY: ldr
+; GREEDY: ldrd
  ; GREEDY: str
  define void @f(i32* nocapture %a, i32* nocapture %b, i32 %n) nounwind {
  entry:
diff --git a/test/CodeGen/ARM/reg_asc_order.ll b/test/CodeGen/ARM/reg_asc_order.ll

new file mode 100644 (file)

index 0000000..d1d0ee5
--- /dev/null
+++ b/test/CodeGen/ARM/reg_asc_order.ll
@@ -0,0 +1,16 @@
+; RUN: llc < %s -march=arm -mcpu=cortex-a8 | FileCheck %s
+; Check that memcpy gets lowered to ldm/stm, at least in this very simple case.
+
+%struct.Foo = type { i32, i32, i32, i32 }
+
+define void @_Z10CopyStructP3FooS0_(%struct.Foo* nocapture %a, %struct.Foo* nocapture %b) nounwind {
+entry:
+;CHECK: ldm
+;CHECK: stm
+  %0 = bitcast %struct.Foo* %a to i8*
+  %1 = bitcast %struct.Foo* %b to i8*
+  tail call void @llvm.memcpy.p0i8.p0i8.i32(i8* %0, i8* %1, i32 16, i32 4, i1 false)
+  ret void
+}
+
+declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i32, i1) nounwind
diff --git a/test/CodeGen/ARM/select.ll b/test/CodeGen/ARM/select.ll

index f1bd7ee53f8841e5a603a0cf6214548ed07bde4f..3e07da841a5aeb832fdbeddb93a6123330b36693 100644 (file)
--- a/test/CodeGen/ARM/select.ll
+++ b/test/CodeGen/ARM/select.ll
@@ -76,12 +76,12 @@ define double @f7(double %a, double %b) {
  ; block generated, odds are good that we have close to the ideal code for this:
  ;
  ; CHECK-NEON:      _f8:
-; CHECK-NEON:      adr     r2, LCPI7_0
-; CHECK-NEON-NEXT: movw    r3, #1123
-; CHECK-NEON-NEXT: adds    r1, r2, #4
-; CHECK-NEON-NEXT: cmp     r0, r3
+; CHECK-NEON:      adr     [[R2:r[0-9]+]], LCPI7_0
+; CHECK-NEON-NEXT: movw    [[R3:r[0-9]+]], #1123
+; CHECK-NEON-NEXT: adds    {{r.*}}, [[R2]], #4
+; CHECK-NEON-NEXT: cmp     r0, [[R3]]
  ; CHECK-NEON-NEXT: it      ne
-; CHECK-NEON-NEXT: movne   r1, r2
+; CHECK-NEON-NEXT: movne   {{r.*}}, [[R2]]
  ; CHECK-NEON-NEXT: ldr
  ; CHECK-NEON:      bx
  
diff --git a/test/CodeGen/X86/store_op_load_fold2.ll b/test/CodeGen/X86/store_op_load_fold2.ll

index 11686227ab9c4a4ddf9e6279369479a5b0f3faee..8313166a90cc3aba481ee203621aa0634bf607d4 100644 (file)
--- a/test/CodeGen/X86/store_op_load_fold2.ll
+++ b/test/CodeGen/X86/store_op_load_fold2.ll
@@ -1,4 +1,5 @@
-; RUN: llc < %s -mtriple=i686-linux -x86-asm-syntax=intel | FileCheck %s
+; RUN: llc < %s -mtriple=i686-linux -x86-asm-syntax=att | FileCheck %s -check-prefix=ATT
+; RUN: llc < %s -mtriple=i686-linux -x86-asm-syntax=intel | FileCheck %s -check-prefix=INTEL
  
  target datalayout = "e-p:32:32"
          %struct.Macroblock = type { i32, i32, i32, i32, i32, [8 x i32], %struct.Macroblock*, %struct.Macroblock*, i32, [2 x [4 x [4 x [2 x i32]]]], [16 x i8], [16 x i8], i32, i64, [4 x i32], [4 x i32], i64, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i16, double, i32, i32, i32, i32, i32, i32, i32, i32, i32 }
@@ -16,9 +17,14 @@ cond_true2732.preheader:                ; preds = %entry
          store i64 %tmp2676.us.us, i64* %tmp2666
          ret i32 0
  
-; CHECK:       and     {{E..}}, DWORD PTR [360]
-; CHECK:       and     DWORD PTR [356], {{E..}}
-; CHECK:       mov     DWORD PTR [360], {{E..}}
+; INTEL:       and     {{E..}}, DWORD PTR [360]
+; INTEL:       and     DWORD PTR [356], {{E..}}
+; FIXME:       mov     DWORD PTR [360], {{E..}}
+; The above line comes out as 'mov 360, EAX', but when the register is ECX it works?
+
+; ATT:         andl    360, %{{e..}}
+; ATT: andl    %{{e..}}, 356
+; ATT: movl    %{{e..}}, 360
  
  }
  
diff --git a/test/CodeGen/X86/vec_shuffle-37.ll b/test/CodeGen/X86/vec_shuffle-37.ll

index 65486cb80c9f14f276643196614a780009b83dc5..619652aff15842342f6bfab7f47f17b6fc0ddf83 100644 (file)
--- a/test/CodeGen/X86/vec_shuffle-37.ll
+++ b/test/CodeGen/X86/vec_shuffle-37.ll
@@ -4,10 +4,10 @@
  
  define <4 x i32> @t00(<4 x i32>* %a0) nounwind ssp {
  entry:
-; CHECK: movaps  ({{%rdi|%rcx}}), %xmm0
-; CHECK: movaps  %xmm0, %xmm1
-; CHECK-NEXT: movss   %xmm2, %xmm1
-; CHECK-NEXT: shufps  $36, %xmm1, %xmm0
+; CHECK: movaps  ({{%rdi|%rcx}}), %[[XMM0:xmm[0-9]+]]
+; CHECK: movaps  %[[XMM0]], %[[XMM1:xmm[0-9]+]]
+; CHECK-NEXT: movss   %xmm{{[0-9]+}}, %[[XMM1]]
+; CHECK-NEXT: shufps  $36, %[[XMM1]], %[[XMM0]]
    %0 = load <4 x i32>* undef, align 16
    %1 = load <4 x i32>* %a0, align 16
    %2 = shufflevector <4 x i32> %1, <4 x i32> %0, <4 x i32> <i32 0, i32 1, i32 2, i32 4>
author	Jakob Stoklund Olesen <stoklund@2pi.dk>
	Mon, 2 Apr 2012 22:30:39 +0000 (22:30 +0000)
committer	Jakob Stoklund Olesen <stoklund@2pi.dk>
	Mon, 2 Apr 2012 22:30:39 +0000 (22:30 +0000)
lib/CodeGen/RegAllocGreedy.cpp		patch | blob | history
test/CodeGen/ARM/ldrd.ll		patch | blob | history
test/CodeGen/ARM/reg_asc_order.ll	[new file with mode: 0644]	patch | blob
test/CodeGen/ARM/select.ll		patch | blob | history
test/CodeGen/X86/store_op_load_fold2.ll		patch | blob | history
test/CodeGen/X86/vec_shuffle-37.ll		patch | blob | history