From e3b2bd1e79c9c9d24490b6ddb2341afcf4210691 Mon Sep 17 00:00:00 2001 From: Hans Wennborg Date: Mon, 22 Feb 2016 17:47:10 +0000 Subject: [PATCH] Merging r261384: ------------------------------------------------------------------------ r261384 | qcolombet | 2016-02-19 16:32:29 -0800 (Fri, 19 Feb 2016) | 4 lines [RegAllocFast] Properly track the physical register definitions on calls. PR26485 ------------------------------------------------------------------------ git-svn-id: https://llvm.org/svn/llvm-project/llvm/branches/release_38@261539 91177308-0d34-0410-b5e6-96231b3b80d8 --- lib/CodeGen/RegAllocFast.cpp | 10 ++++--- test/CodeGen/ARM/Windows/alloca.ll | 4 ++- test/CodeGen/X86/i386-tlscall-fastregalloc.ll | 26 +++++++++++++++++++ 3 files changed, 35 insertions(+), 5 deletions(-) create mode 100644 test/CodeGen/X86/i386-tlscall-fastregalloc.ll diff --git a/lib/CodeGen/RegAllocFast.cpp b/lib/CodeGen/RegAllocFast.cpp index f4c076fea0e..8d7a7213ba0 100644 --- a/lib/CodeGen/RegAllocFast.cpp +++ b/lib/CodeGen/RegAllocFast.cpp @@ -1002,11 +1002,13 @@ void RAFast::AllocateBasicBlock() { unsigned DefOpEnd = MI->getNumOperands(); if (MI->isCall()) { - // Spill all virtregs before a call. This serves two purposes: 1. If an + // Spill all virtregs before a call. This serves one purpose: If an // exception is thrown, the landing pad is going to expect to find - // registers in their spill slots, and 2. we don't have to wade through - // all the operands on the call instruction. - DefOpEnd = VirtOpEnd; + // registers in their spill slots. + // Note: although this is appealing to just consider all definitions + // as call-clobbered, this is not correct because some of those + // definitions may be used later on and we do not want to reuse + // those for virtual registers in between. DEBUG(dbgs() << " Spilling remaining registers before call.\n"); spillAll(MI); diff --git a/test/CodeGen/ARM/Windows/alloca.ll b/test/CodeGen/ARM/Windows/alloca.ll index 6a3d002ab3b..0f20ffbd36d 100644 --- a/test/CodeGen/ARM/Windows/alloca.ll +++ b/test/CodeGen/ARM/Windows/alloca.ll @@ -13,7 +13,9 @@ entry: } ; CHECK: bl num_entries -; CHECK: movs [[R1:r[0-9]+]], #7 +; Any register is actually valid here, but turns out we use lr, +; because we do not have the kill flag on R0. +; CHECK: mov.w [[R1:lr]], #7 ; CHECK: add.w [[R0:r[0-9]+]], [[R1]], [[R0]], lsl #2 ; CHECK: bic [[R0]], [[R0]], #7 ; CHECK: lsrs r4, [[R0]], #2 diff --git a/test/CodeGen/X86/i386-tlscall-fastregalloc.ll b/test/CodeGen/X86/i386-tlscall-fastregalloc.ll new file mode 100644 index 00000000000..775c0c1b378 --- /dev/null +++ b/test/CodeGen/X86/i386-tlscall-fastregalloc.ll @@ -0,0 +1,26 @@ +; RUN: llc %s -o - -O0 -regalloc=fast | FileCheck %s +target datalayout = "e-m:o-p:32:32-f64:32:64-f80:128-n8:16:32-S128" +target triple = "i386-apple-macosx10.10" + +@c = external global i8, align 1 +@p = thread_local global i8* null, align 4 + +; Check that regalloc fast correctly preserves EAX that is set by the TLS call +; until the actual use. +; PR26485. +; +; CHECK-LABEL: f: +; Get p. +; CHECK: movl _p@{{[0-9a-zA-Z]+}}, [[P_ADDR:%[a-z]+]] +; CHECK-NEXT: calll *([[P_ADDR]]) +; At this point eax contiains the address of p. +; Load c address. +; Make sure we do not clobber eax. +; CHECK-NEXT: movl L_c{{[^,]*}}, [[C_ADDR:%e[b-z]x+]] +; Store c address into p. +; CHECK-NEXT: movl [[C_ADDR]], (%eax) +define void @f() #0 { +entry: + store i8* @c, i8** @p, align 4 + ret void +} -- 2.34.1