[dfsan] Introduce an optimization to reduce the number of union queries.

author Peter Collingbourne <peter@pcc.me.uk>

Tue, 15 Jul 2014 04:41:17 +0000 (04:41 +0000)

committer Peter Collingbourne <peter@pcc.me.uk>

Tue, 15 Jul 2014 04:41:17 +0000 (04:41 +0000)
author Peter Collingbourne <peter@pcc.me.uk>
Tue, 15 Jul 2014 04:41:17 +0000 (04:41 +0000)
committer Peter Collingbourne <peter@pcc.me.uk>
Tue, 15 Jul 2014 04:41:17 +0000 (04:41 +0000)
diff --git a/lib/Transforms/Instrumentation/DataFlowSanitizer.cpp b/lib/Transforms/Instrumentation/DataFlowSanitizer.cpp

index 0ea49c0a1908a8086a1653dee8bca512f7939d32..6419adc85a2e02373b02820b2f526a4d43dcf6a5 100644 (file)
--- a/lib/Transforms/Instrumentation/DataFlowSanitizer.cpp
+++ b/lib/Transforms/Instrumentation/DataFlowSanitizer.cpp
@@ -50,6 +50,7 @@
  #include "llvm/ADT/DepthFirstIterator.h"
  #include "llvm/ADT/StringExtras.h"
  #include "llvm/Analysis/ValueTracking.h"
+#include "llvm/IR/Dominators.h"
  #include "llvm/IR/IRBuilder.h"
  #include "llvm/IR/InlineAsm.h"
  #include "llvm/IR/InstVisitor.h"
@@ -265,6 +266,7 @@ class DataFlowSanitizer : public ModulePass {
  struct DFSanFunction {
    DataFlowSanitizer &DFS;
    Function *F;
+  DominatorTree DT;
    DataFlowSanitizer::InstrumentedABI IA;
    bool IsNativeABI;
    Value *ArgTLSPtr;
@@ -276,10 +278,19 @@ struct DFSanFunction {
    DenseSet<Instruction *> SkipInsts;
    DenseSet<Value *> NonZeroChecks;
  
+  struct CachedCombinedShadow {
+    BasicBlock *Block;
+    Value *Shadow;
+  };
+  DenseMap<std::pair<Value *, Value *>, CachedCombinedShadow>
+      CachedCombinedShadows;
+
    DFSanFunction(DataFlowSanitizer &DFS, Function *F, bool IsNativeABI)
        : DFS(DFS), F(F), IA(DFS.getInstrumentedABI()),
          IsNativeABI(IsNativeABI), ArgTLSPtr(nullptr), RetvalTLSPtr(nullptr),
-        LabelReturnAlloca(nullptr) {}
+        LabelReturnAlloca(nullptr) {
+    DT.recalculate(*F);
+  }
    Value *getArgTLSPtr();
    Value *getArgTLS(unsigned Index, Instruction *Pos);
    Value *getRetvalTLS();
@@ -880,6 +891,14 @@ Value *DFSanFunction::combineShadows(Value *V1, Value *V2, Instruction *Pos) {
      return V1;
    if (V1 == V2)
      return V1;
+
+  auto Key = std::make_pair(V1, V2);
+  if (V1 > V2)
+    std::swap(Key.first, Key.second);
+  CachedCombinedShadow &CCS = CachedCombinedShadows[Key];
+  if (CCS.Block && DT.dominates(CCS.Block, Pos->getParent()))
+    return CCS.Shadow;
+
    IRBuilder<> IRB(Pos);
    BasicBlock *Head = Pos->getParent();
    Value *Ne = IRB.CreateICmpNE(V1, V2);
@@ -895,6 +914,9 @@ Value *DFSanFunction::combineShadows(Value *V1, Value *V2, Instruction *Pos) {
    PHINode *Phi = PHINode::Create(DFS.ShadowTy, 2, "", Tail->begin());
    Phi->addIncoming(Call, Call->getParent());
    Phi->addIncoming(V1, Head);
+
+  CCS.Block = Tail;
+  CCS.Shadow = Phi;
    return Phi;
  }
  
@@ -988,16 +1010,27 @@ Value *DFSanFunction::loadShadow(Value *Addr, uint64_t Size, uint64_t Align,
  
      BasicBlock *Head = Pos->getParent();
      BasicBlock *Tail = Head->splitBasicBlock(Pos);
+
+    if (DomTreeNode *OldNode = DT.getNode(Head)) {
+      std::vector<DomTreeNode *> Children(OldNode->begin(), OldNode->end());
+
+      DomTreeNode *NewNode = DT.addNewBlock(Tail, Head);
+      for (auto Child : Children)
+        DT.changeImmediateDominator(Child, NewNode);
+    }
+
      // In the following code LastBr will refer to the previous basic block's
      // conditional branch instruction, whose true successor is fixed up to point
      // to the next block during the loop below or to the tail after the final
      // iteration.
      BranchInst *LastBr = BranchInst::Create(FallbackBB, FallbackBB, ShadowsEq);
      ReplaceInstWithInst(Head->getTerminator(), LastBr);
+    DT.addNewBlock(FallbackBB, Head);
  
      for (uint64_t Ofs = 64 / DFS.ShadowWidth; Ofs != Size;
           Ofs += 64 / DFS.ShadowWidth) {
        BasicBlock *NextBB = BasicBlock::Create(*DFS.Ctx, "", F);
+      DT.addNewBlock(NextBB, LastBr->getParent());
        IRBuilder<> NextIRB(NextBB);
        WideAddr = NextIRB.CreateGEP(WideAddr, ConstantInt::get(DFS.IntptrTy, 1));
        Value *NextWideShadow = NextIRB.CreateAlignedLoad(WideAddr, ShadowAlign);
diff --git a/test/Instrumentation/DataFlowSanitizer/union.ll b/test/Instrumentation/DataFlowSanitizer/union.ll

new file mode 100644 (file)

index 0000000..30162e7
--- /dev/null
+++ b/test/Instrumentation/DataFlowSanitizer/union.ll
@@ -0,0 +1,41 @@
+; RUN: opt < %s -dfsan -S | FileCheck %s
+target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
+
+@a = common global i32 0
+@b = common global i32 0
+
+; Check that we reuse unions where possible.
+
+; CHECK-LABEL: @"dfs$f"
+define void @f(i32 %x, i32 %y) {
+  ; CHECK: __dfsan_union
+  %xay = add i32 %x, %y
+  store i32 %xay, i32* @a
+  ; CHECK-NOT: __dfsan_union
+  %xmy = mul i32 %x, %y
+  store i32 %xmy, i32* @b
+  ret void
+}
+
+; In this case, we compute the unions on both sides because neither block
+; dominates the other.
+
+; CHECK-LABEL: @"dfs$g"
+define void @g(i1 %p, i32 %x, i32 %y) {
+  br i1 %p, label %l1, label %l2
+
+l1:
+  ; CHECK: __dfsan_union
+  %xay = add i32 %x, %y
+  store i32 %xay, i32* @a
+  br label %l3
+
+l2:
+  ; CHECK: __dfsan_union
+  %xmy = mul i32 %x, %y
+  store i32 %xmy, i32* @b
+  br label %l3
+
+l3:
+  ret void
+}
author	Peter Collingbourne <peter@pcc.me.uk>
	Tue, 15 Jul 2014 04:41:17 +0000 (04:41 +0000)
committer	Peter Collingbourne <peter@pcc.me.uk>
	Tue, 15 Jul 2014 04:41:17 +0000 (04:41 +0000)
lib/Transforms/Instrumentation/DataFlowSanitizer.cpp		patch \| blob \| history
test/Instrumentation/DataFlowSanitizer/union.ll	[new file with mode: 0644]	patch \| blob