fix PR5436 by making the 'simple' case of SRoA not promote out of range

author Chris Lattner <sabre@nondot.org>

Fri, 27 Nov 2009 16:37:41 +0000 (16:37 +0000)

committer Chris Lattner <sabre@nondot.org>

Fri, 27 Nov 2009 16:37:41 +0000 (16:37 +0000)
author Chris Lattner <sabre@nondot.org>
Fri, 27 Nov 2009 16:37:41 +0000 (16:37 +0000)
committer Chris Lattner <sabre@nondot.org>
Fri, 27 Nov 2009 16:37:41 +0000 (16:37 +0000)
diff --git a/lib/Transforms/Scalar/ScalarReplAggregates.cpp b/lib/Transforms/Scalar/ScalarReplAggregates.cpp

index 047d279e8e292d53d6260ff9ae7b390b260c10f8..ae6ad74d54fde218070127827d7b4bd5a342b259 100644 (file)
--- a/lib/Transforms/Scalar/ScalarReplAggregates.cpp
+++ b/lib/Transforms/Scalar/ScalarReplAggregates.cpp
@@ -469,15 +469,41 @@ void SROA::isSafeElementUse(Value *Ptr, bool isFirstElt, AllocaInst *AI,
      case Instruction::GetElementPtr: {
        GetElementPtrInst *GEP = cast<GetElementPtrInst>(User);
        bool AreAllZeroIndices = isFirstElt;
-      if (GEP->getNumOperands() > 1) {
-        if (!isa<ConstantInt>(GEP->getOperand(1)) ||
-            !cast<ConstantInt>(GEP->getOperand(1))->isZero())
-          // Using pointer arithmetic to navigate the array.
-          return MarkUnsafe(Info);
-       
-        if (AreAllZeroIndices)
-          AreAllZeroIndices = GEP->hasAllZeroIndices();
+      if (GEP->getNumOperands() > 1 &&
+          (!isa<ConstantInt>(GEP->getOperand(1)) ||
+           !cast<ConstantInt>(GEP->getOperand(1))->isZero()))
+        // Using pointer arithmetic to navigate the array.
+        return MarkUnsafe(Info);
+      
+      // Verify that any array subscripts are in range.
+      for (gep_type_iterator GEPIt = gep_type_begin(GEP),
+           E = gep_type_end(GEP); GEPIt != E; ++GEPIt) {
+        // Ignore struct elements, no extra checking needed for these.
+        if (isa<StructType>(*GEPIt))
+          continue;
+
+        // This GEP indexes an array.  Verify that this is an in-range
+        // constant integer. Specifically, consider A[0][i]. We cannot know that
+        // the user isn't doing invalid things like allowing i to index an
+        // out-of-range subscript that accesses A[1].  Because of this, we have
+        // to reject SROA of any accesses into structs where any of the
+        // components are variables. 
+        ConstantInt *IdxVal = dyn_cast<ConstantInt>(GEPIt.getOperand());
+        if (!IdxVal) return MarkUnsafe(Info);
+        
+        // Are all indices still zero?
+        AreAllZeroIndices &= IdxVal->isZero();
+        
+        if (const ArrayType *AT = dyn_cast<ArrayType>(*GEPIt)) {
+          if (IdxVal->getZExtValue() >= AT->getNumElements())
+            return MarkUnsafe(Info);
+        } else if (const VectorType *VT = dyn_cast<VectorType>(*GEPIt)) {
+          if (IdxVal->getZExtValue() >= VT->getNumElements())
+            return MarkUnsafe(Info);
+        }
        }
+      
+      
        isSafeElementUse(GEP, AreAllZeroIndices, AI, Info);
        if (Info.isUnsafe) return;
        break;
diff --git a/test/Transforms/ScalarRepl/badarray.ll b/test/Transforms/ScalarRepl/badarray.ll

index decdd4bc29557e73ee00dadea516dc6c3313eaa3..3ec3c01b2836ed5c825da673dd6b2bcea8d02600 100644 (file)
--- a/test/Transforms/ScalarRepl/badarray.ll
+++ b/test/Transforms/ScalarRepl/badarray.ll
@@ -1,10 +1,14 @@
  ; RUN: opt < %s -scalarrepl -S | FileCheck %s
  
+target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:64:64-v128:128:128-a0:0:64-f80:32:32-n8:16:32"
+target triple = "i386-pc-linux-gnu"
+
+
  ; PR3466
  ; Off end of array, don't transform.
  define i32 @test1() {
  ; CHECK: @test1
-; CHECK: %X = alloca
+; CHECK-NOT: = alloca
         %X = alloca [4 x i32]
         %Y = getelementptr [4 x i32]* %X, i64 0, i64 6          ; <i32*> [#uses=2]
         store i32 0, i32* %Y
@@ -17,9 +21,37 @@ define i32 @test1() {
  define i32 @test2() nounwind {
  entry:
  ; CHECK: @test2
-; CHECK: %yx2.i = alloca
+; CHECK-NOT: = alloca
          %yx2.i = alloca float, align 4          ; <float*> [#uses=1]            
          %yx26.i = bitcast float* %yx2.i to i64*         ; <i64*> [#uses=1]      
          %0 = load i64* %yx26.i, align 8         ; <i64> [#uses=0]               
          unreachable
  }
+
+%base = type { i32, [0 x i8] }
+%padded = type { %base, [1 x i32] }
+
+; PR5436
+define void @test3() {
+entry:
+; CHECK: @test3
+; CHECK-NOT: = alloca
+; CHECK: store i64
+  %var_1 = alloca %padded, align 8                ; <%padded*> [#uses=3]
+  %0 = getelementptr inbounds %padded* %var_1, i32 0, i32 0 ; <%base*> [#uses=2]
+  
+  %p2 = getelementptr inbounds %base* %0, i32 0, i32 1, i32 0 ; <i8*> [#uses=1]
+  store i8 72, i8* %p2, align 1
+  
+  ; 72 -> a[0].
+
+  %callret = call %padded *@test3f() ; <i32> [#uses=2]
+  %callretcast = bitcast %padded* %callret to i8*                     ; <i8*> [#uses=1]
+  %var_11 = bitcast %padded* %var_1 to i8*        ; <i8*> [#uses=1]
+  call void @llvm.memcpy.i32(i8* %callretcast, i8* %var_11, i32 8, i32 4)
+  ret void
+}
+
+declare void @llvm.memcpy.i32(i8* nocapture, i8* nocapture, i32, i32) nounwind
+
+declare %padded* @test3f()
author	Chris Lattner <sabre@nondot.org>
	Fri, 27 Nov 2009 16:37:41 +0000 (16:37 +0000)
committer	Chris Lattner <sabre@nondot.org>
	Fri, 27 Nov 2009 16:37:41 +0000 (16:37 +0000)
lib/Transforms/Scalar/ScalarReplAggregates.cpp		patch \| blob \| history
test/Transforms/ScalarRepl/badarray.ll		patch \| blob \| history