lib/Transforms/IPO/OldPoolAllocate.cpp

   1 //===-- PoolAllocate.cpp - Pool Allocation Pass ---------------------------===//
   2 //
   3 // This transform changes programs so that disjoint data structures are
   4 // allocated out of different pools of memory, increasing locality and shrinking
   5 // pointer size.
   6 //
   7 //===----------------------------------------------------------------------===//
   8
   9 #include "llvm/Transforms/IPO/PoolAllocate.h"
  10 #include "llvm/Transforms/CloneFunction.h"
  11 #include "llvm/Analysis/DataStructure.h"
  12 #include "llvm/Analysis/DataStructureGraph.h"
  13 #include "llvm/Pass.h"
  14 #include "llvm/Module.h"
  15 #include "llvm/Function.h"
  16 #include "llvm/iMemory.h"
  17 #include "llvm/iTerminators.h"
  18 #include "llvm/iOther.h"
  19 #include "llvm/ConstantVals.h"
  20 #include "llvm/Target/TargetData.h"
  21 #include "llvm/Support/InstVisitor.h"
  22 #include "Support/DepthFirstIterator.h"
  23 #include "Support/STLExtras.h"
  24 #include <algorithm>
  25
  26
  27 // FIXME: This is dependant on the sparc backend layout conventions!!
  28 static TargetData TargetData("test");
  29
  30 namespace {
  31   // ScalarInfo - Information about an LLVM value that we know points to some
  32   // datastructure we are processing.
  33   //
  34   struct ScalarInfo {
  35     Value  *Val;            // Scalar value in Current Function
  36     DSNode *Node;           // DataStructure node it points to
  37     Value  *PoolHandle;     // PoolTy* LLVM value
  38
  39     ScalarInfo(Value *V, DSNode *N, Value *PH)
  40       : Val(V), Node(N), PoolHandle(PH) {
  41       assert(V && N && PH && "Null value passed to ScalarInfo ctor!");
  42     }
  43   };
  44
  45   // CallArgInfo - Information on one operand for a call that got expanded.
  46   struct CallArgInfo {
  47     int ArgNo;          // Call argument number this corresponds to
  48     DSNode *Node;       // The graph node for the pool
  49     Value *PoolHandle;  // The LLVM value that is the pool pointer
  50
  51     CallArgInfo(int Arg, DSNode *N, Value *PH)
  52       : ArgNo(Arg), Node(N), PoolHandle(PH) {
  53       assert(Arg >= -1 && N && PH && "Illegal values to CallArgInfo ctor!");
  54     }
  55
  56     // operator< when sorting, sort by argument number.
  57     bool operator<(const CallArgInfo &CAI) const {
  58       return ArgNo < CAI.ArgNo;
  59     }
  60   };
  61
  62   // TransformFunctionInfo - Information about how a function eeds to be
  63   // transformed.
  64   //
  65   struct TransformFunctionInfo {
  66     // ArgInfo - Maintain information about the arguments that need to be
  67     // processed.  Each pair corresponds to an argument (whose number is the
  68     // first element) that needs to have a pool pointer (the second element)
  69     // passed into the transformed function with it.
  70     //
  71     // As a special case, "argument" number -1 corresponds to the return value.
  72     //
  73     vector<CallArgInfo> ArgInfo;
  74
  75     // Func - The function to be transformed...
  76     Function *Func;
  77
  78     // The call instruction that is used to map CallArgInfo PoolHandle values
  79     // into the new function values.
  80     CallInst *Call;
  81
  82     // default ctor...
  83     TransformFunctionInfo() : Func(0), Call(0) {}
  84
  85     bool operator<(const TransformFunctionInfo &TFI) const {
  86       if (Func < TFI.Func) return true;
  87       if (Func > TFI.Func) return false;
  88       if (ArgInfo.size() < TFI.ArgInfo.size()) return true;
  89       if (ArgInfo.size() > TFI.ArgInfo.size()) return false;
  90       return ArgInfo < TFI.ArgInfo;
  91     }
  92
  93     void finalizeConstruction() {
  94       // Sort the vector so that the return value is first, followed by the
  95       // argument records, in order.  Note that this must be a stable sort so
  96       // that the entries with the same sorting criteria (ie they are multiple
  97       // pool entries for the same argument) are kept in depth first order.
  98       stable_sort(ArgInfo.begin(), ArgInfo.end());
  99     }
 100   };
 101
 102
 103   // Define the pass class that we implement...
 104   class PoolAllocate : public Pass {
 105     // PoolTy - The type of a scalar value that contains a pool pointer.
 106     PointerType *PoolTy;
 107   public:
 108
 109     PoolAllocate() {
 110       // Initialize the PoolTy instance variable, since the type never changes.
 111       vector<const Type*> PoolElements;
 112       PoolElements.push_back(PointerType::get(Type::SByteTy));
 113       PoolElements.push_back(Type::UIntTy);
 114       PoolTy = PointerType::get(StructType::get(PoolElements));
 115       // PoolTy = { sbyte*, uint }*
 116
 117       CurModule = 0; DS = 0;
 118       PoolInit = PoolDestroy = PoolAlloc = PoolFree = 0;
 119     }
 120
 121     bool run(Module *M);
 122
 123     // getAnalysisUsageInfo - This function requires data structure information
 124     // to be able to see what is pool allocatable.
 125     //
 126     virtual void getAnalysisUsageInfo(Pass::AnalysisSet &Required,
 127                                       Pass::AnalysisSet &,Pass::AnalysisSet &) {
 128       Required.push_back(DataStructure::ID);
 129     }
 130
 131   public:
 132     // CurModule - The module being processed.
 133     Module *CurModule;
 134
 135     // DS - The data structure graph for the module being processed.
 136     DataStructure *DS;
 137
 138     // Prototypes that we add to support pool allocation...
 139     Function *PoolInit, *PoolDestroy, *PoolAlloc, *PoolFree;
 140
 141     // The map of already transformed functions... note that the keys of this
 142     // map do not have meaningful values for 'Call' or the 'PoolHandle' elements
 143     // of the ArgInfo elements.
 144     //
 145     map<TransformFunctionInfo, Function*> TransformedFunctions;
 146
 147     // getTransformedFunction - Get a transformed function, or return null if
 148     // the function specified hasn't been transformed yet.
 149     //
 150     Function *getTransformedFunction(TransformFunctionInfo &TFI) const {
 151       map<TransformFunctionInfo, Function*>::const_iterator I =
 152         TransformedFunctions.find(TFI);
 153       if (I != TransformedFunctions.end()) return I->second;
 154       return 0;
 155     }
 156
 157
 158     // addPoolPrototypes - Add prototypes for the pool methods to the specified
 159     // module and update the Pool* instance variables to point to them.
 160     //
 161     void addPoolPrototypes(Module *M);
 162
 163
 164     // CreatePools - Insert instructions into the function we are processing to
 165     // create all of the memory pool objects themselves.  This also inserts
 166     // destruction code.  Add an alloca for each pool that is allocated to the
 167     // PoolDescriptors map.
 168     //
 169     void CreatePools(Function *F, const vector<AllocDSNode*> &Allocs,
 170                      map<DSNode*, Value*> &PoolDescriptors);
 171
 172     // processFunction - Convert a function to use pool allocation where
 173     // available.
 174     //
 175     bool processFunction(Function *F);
 176
 177     // transformFunctionBody - This transforms the instruction in 'F' to use the
 178     // pools specified in PoolDescriptors when modifying data structure nodes
 179     // specified in the PoolDescriptors map.  IPFGraph is the closed data
 180     // structure graph for F, of which the PoolDescriptor nodes come from.
 181     //
 182     void transformFunctionBody(Function *F, FunctionDSGraph &IPFGraph,
 183                                map<DSNode*, Value*> &PoolDescriptors);
 184
 185     // transformFunction - Transform the specified function the specified way.
 186     // It we have already transformed that function that way, don't do anything.
 187     // The nodes in the TransformFunctionInfo come out of callers data structure
 188     // graph.
 189     //
 190     void transformFunction(TransformFunctionInfo &TFI,
 191                            FunctionDSGraph &CallerIPGraph);
 192
 193   };
 194 }
 195
 196
 197
 198 // isNotPoolableAlloc - This is a predicate that returns true if the specified
 199 // allocation node in a data structure graph is eligable for pool allocation.
 200 //
 201 static bool isNotPoolableAlloc(const AllocDSNode *DS) {
 202   if (DS->isAllocaNode()) return true;  // Do not pool allocate alloca's.
 203
 204   MallocInst *MI = cast<MallocInst>(DS->getAllocation());
 205   if (MI->isArrayAllocation() && !isa<Constant>(MI->getArraySize()))
 206     return true;   // Do not allow variable size allocations...
 207
 208   return false;
 209 }
 210
 211 // processFunction - Convert a function to use pool allocation where
 212 // available.
 213 //
 214 bool PoolAllocate::processFunction(Function *F) {
 215   // Get the closed datastructure graph for the current function... if there are
 216   // any allocations in this graph that are not escaping, we need to pool
 217   // allocate them here!
 218   //
 219   FunctionDSGraph &IPGraph = DS->getClosedDSGraph(F);
 220
 221   // Get all of the allocations that do not escape the current function.  Since
 222   // they are still live (they exist in the graph at all), this means we must
 223   // have scalar references to these nodes, but the scalars are never returned.
 224   //
 225   vector<AllocDSNode*> Allocs;
 226   IPGraph.getNonEscapingAllocations(Allocs);
 227
 228   // Filter out allocations that we cannot handle.  Currently, this includes
 229   // variable sized array allocations and alloca's (which we do not want to
 230   // pool allocate)
 231   //
 232   Allocs.erase(remove_if(Allocs.begin(), Allocs.end(), isNotPoolableAlloc),
 233                Allocs.end());
 234
 235
 236   if (Allocs.empty()) return false;  // Nothing to do.
 237
 238   // Insert instructions into the function we are processing to create all of
 239   // the memory pool objects themselves.  This also inserts destruction code.
 240   // This fills in the PoolDescriptors map to associate the alloc node with the
 241   // allocation of the memory pool corresponding to it.
 242   //
 243   map<DSNode*, Value*> PoolDescriptors;
 244   CreatePools(F, Allocs, PoolDescriptors);
 245
 246   // Now we need to figure out what called methods we need to transform, and
 247   // how.  To do this, we look at all of the scalars, seeing which functions are
 248   // either used as a scalar value (so they return a data structure), or are
 249   // passed one of our scalar values.
 250   //
 251   transformFunctionBody(F, IPGraph, PoolDescriptors);
 252
 253   return true;
 254 }
 255
 256
 257 class FunctionBodyTransformer : public InstVisitor<FunctionBodyTransformer> {
 258   PoolAllocate &PoolAllocator;
 259   vector<ScalarInfo> &Scalars;
 260   map<CallInst*, TransformFunctionInfo> &CallMap;
 261
 262   const ScalarInfo &getScalar(const Value *V) {
 263     for (unsigned i = 0, e = Scalars.size(); i != e; ++i)
 264       if (Scalars[i].Val == V) return Scalars[i];
 265     assert(0 && "Scalar not found in getScalar!");
 266     abort();
 267     return Scalars[0];
 268   }
 269
 270   // updateScalars - Map the scalars array entries that look like 'From' to look
 271   // like 'To'.
 272   //
 273   void updateScalars(Value *From, Value *To) {
 274     for (unsigned i = 0, e = Scalars.size(); i != e; ++i)
 275       if (Scalars[i].Val == From) Scalars[i].Val = To;
 276   }
 277
 278 public:
 279   FunctionBodyTransformer(PoolAllocate &PA, vector<ScalarInfo> &S,
 280                           map<CallInst*, TransformFunctionInfo> &C)
 281     : PoolAllocator(PA), Scalars(S), CallMap(C) {}
 282
 283   void visitMemAccessInst(MemAccessInst *MAI) {
 284     // Don't do anything to load, store, or GEP yet...
 285   }
 286
 287   // Convert a malloc instruction into a call to poolalloc
 288   void visitMallocInst(MallocInst *I) {
 289     const ScalarInfo &SC = getScalar(I);
 290     BasicBlock *BB = I->getParent();
 291     BasicBlock::iterator MI = find(BB->begin(), BB->end(), I);
 292     BB->getInstList().remove(MI);  // Remove the Malloc instruction from the BB
 293
 294     // Create a new call to poolalloc before the malloc instruction
 295     vector<Value*> Args;
 296     Args.push_back(SC.PoolHandle);
 297     CallInst *Call = new CallInst(PoolAllocator.PoolAlloc, Args, I->getName());
 298     MI = BB->getInstList().insert(MI, Call)+1;
 299
 300     // If the type desired is not void*, cast it now...
 301     Value *Ptr = Call;
 302     if (Call->getType() != I->getType()) {
 303       CastInst *CI = new CastInst(Ptr, I->getType(), I->getName());
 304       BB->getInstList().insert(MI, CI);
 305       Ptr = CI;
 306     }
 307
 308     // Change everything that used the malloc to now use the pool alloc...
 309     I->replaceAllUsesWith(Ptr);
 310
 311     // Update the scalars array...
 312     updateScalars(I, Ptr);
 313
 314     // Delete the instruction now.
 315     delete I;
 316   }
 317
 318   // Convert the free instruction into a call to poolfree
 319   void visitFreeInst(FreeInst *I) {
 320     Value *Ptr = I->getOperand(0);
 321     const ScalarInfo &SC = getScalar(Ptr);
 322     BasicBlock *BB = I->getParent();
 323     BasicBlock::iterator FI = find(BB->begin(), BB->end(), I);
 324
 325     // If the value is not an sbyte*, convert it now!
 326     if (Ptr->getType() != PointerType::get(Type::SByteTy)) {
 327       CastInst *CI = new CastInst(Ptr, PointerType::get(Type::SByteTy),
 328                                   Ptr->getName());
 329       FI = BB->getInstList().insert(FI, CI)+1;
 330       Ptr = CI;
 331     }
 332
 333     // Create a new call to poolfree before the free instruction
 334     vector<Value*> Args;
 335     Args.push_back(SC.PoolHandle);
 336     Args.push_back(Ptr);
 337     CallInst *Call = new CallInst(PoolAllocator.PoolFree, Args);
 338     FI = BB->getInstList().insert(FI, Call)+1;
 339
 340     // Remove the old free instruction...
 341     delete BB->getInstList().remove(FI);
 342   }
 343
 344   // visitCallInst - Create a new call instruction with the extra arguments for
 345   // all of the memory pools that the call needs.
 346   //
 347   void visitCallInst(CallInst *I) {
 348     TransformFunctionInfo &TI = CallMap[I];
 349     BasicBlock *BB = I->getParent();
 350     BasicBlock::iterator CI = find(BB->begin(), BB->end(), I);
 351     BB->getInstList().remove(CI);  // Remove the old call instruction
 352
 353     // Start with all of the old arguments...
 354     vector<Value*> Args(I->op_begin()+1, I->op_end());
 355
 356     // Add all of the pool arguments...
 357     for (unsigned i = 0, e = TI.ArgInfo.size(); i != e; ++i)
 358       Args.push_back(TI.ArgInfo[i].PoolHandle);
 359
 360     Function *NF = PoolAllocator.getTransformedFunction(TI);
 361     CallInst *NewCall = new CallInst(NF, Args, I->getName());
 362     BB->getInstList().insert(CI, NewCall);
 363
 364     // Change everything that used the malloc to now use the pool alloc...
 365     if (I->getType() != Type::VoidTy) {
 366       I->replaceAllUsesWith(NewCall);
 367
 368       // Update the scalars array...
 369       updateScalars(I, NewCall);
 370     }
 371
 372     delete I;  // Delete the old call instruction now...
 373   }
 374
 375   void visitPHINode(PHINode *PN) {
 376     // Handle PHI Node
 377   }
 378
 379   void visitReturnInst(ReturnInst *I) {
 380     // Nothing of interest
 381   }
 382
 383   void visitInstruction(Instruction *I) {
 384     cerr << "Unknown instruction to FunctionBodyTransformer:\n";
 385     I->dump();
 386   }
 387
 388 };
 389
 390
 391 static void addCallInfo(TransformFunctionInfo &TFI, CallInst *CI, int Arg,
 392                         DSNode *GraphNode,
 393                         map<DSNode*, Value*> &PoolDescriptors) {
 394
 395   // For now, add the entire graph that is pointed to by the call argument.
 396   // This graph can and should be pruned to only what the function itself will
 397   // use, because often this will be a dramatically smaller subset of what we
 398   // are providing.
 399   //
 400   for (df_iterator<DSNode*> I = df_begin(GraphNode), E = df_end(GraphNode);
 401        I != E; ++I) {
 402     TFI.ArgInfo.push_back(CallArgInfo(Arg, *I, PoolDescriptors[*I]));
 403   }
 404
 405   assert(CI->getCalledFunction() && "Cannot handle indirect calls yet!");
 406   assert(TFI.Func == 0 || TFI.Func == CI->getCalledFunction() &&
 407          "Function call record should always call the same function!");
 408   assert(TFI.Call == 0 || TFI.Call == CI &&
 409          "Call element already filled in with different value!");
 410   TFI.Func = CI->getCalledFunction();
 411   TFI.Call = CI;
 412 }
 413
 414
 415 // transformFunctionBody - This transforms the instruction in 'F' to use the
 416 // pools specified in PoolDescriptors when modifying data structure nodes
 417 // specified in the PoolDescriptors map.  Specifically, scalar values specified
 418 // in the Scalars vector must be remapped.  IPFGraph is the closed data
 419 // structure graph for F, of which the PoolDescriptor nodes come from.
 420 //
 421 void PoolAllocate::transformFunctionBody(Function *F, FunctionDSGraph &IPFGraph,
 422                                        map<DSNode*, Value*> &PoolDescriptors) {
 423
 424   // Loop through the value map looking for scalars that refer to nonescaping
 425   // allocations.  Add them to the Scalars vector.  Note that we may have
 426   // multiple entries in the Scalars vector for each value if it points to more
 427   // than one object.
 428   //
 429   map<Value*, PointerValSet> &ValMap = IPFGraph.getValueMap();
 430   vector<ScalarInfo> Scalars;
 431
 432   cerr << "Building scalar map:\n";
 433
 434   for (map<Value*, PointerValSet>::iterator I = ValMap.begin(),
 435          E = ValMap.end(); I != E; ++I) {
 436     const PointerValSet &PVS = I->second;  // Set of things pointed to by scalar
 437
 438     cerr << "Scalar Mapping from:"; I->first->dump();
 439     cerr << "\nScalar Mapping to: "; PVS.print(cerr);
 440
 441     assert(PVS.size() == 1 &&
 442            "Only handle scalars that point to one thing so far!");
 443
 444     // Check to see if the scalar points to a data structure node...
 445     for (unsigned i = 0, e = PVS.size(); i != e; ++i) {
 446       assert(PVS[i].Index == 0 && "Nonzero not handled yet!");
 447
 448       // If the allocation is in the nonescaping set...
 449       map<DSNode*, Value*>::iterator AI = PoolDescriptors.find(PVS[i].Node);
 450       if (AI != PoolDescriptors.end()) // Add it to the list of scalars
 451         Scalars.push_back(ScalarInfo(I->first, PVS[i].Node, AI->second));
 452     }
 453   }
 454
 455
 456
 457   cerr << "\nIn '" << F->getName()
 458        << "': Found the following values that point to poolable nodes:\n";
 459
 460   for (unsigned i = 0, e = Scalars.size(); i != e; ++i)
 461     Scalars[i].Val->dump();
 462
 463   // CallMap - Contain an entry for every call instruction that needs to be
 464   // transformed.  Each entry in the map contains information about what we need
 465   // to do to each call site to change it to work.
 466   //
 467   map<CallInst*, TransformFunctionInfo> CallMap;
 468
 469   // Now we need to figure out what called methods we need to transform, and
 470   // how.  To do this, we look at all of the scalars, seeing which functions are
 471   // either used as a scalar value (so they return a data structure), or are
 472   // passed one of our scalar values.
 473   //
 474   for (unsigned i = 0, e = Scalars.size(); i != e; ++i) {
 475     Value *ScalarVal = Scalars[i].Val;
 476
 477     // Check to see if the scalar _IS_ a call...
 478     if (CallInst *CI = dyn_cast<CallInst>(ScalarVal))
 479       // If so, add information about the pool it will be returning...
 480       addCallInfo(CallMap[CI], CI, -1, Scalars[i].Node, PoolDescriptors);
 481
 482     // Check to see if the scalar is an operand to a call...
 483     for (Value::use_iterator UI = ScalarVal->use_begin(),
 484            UE = ScalarVal->use_end(); UI != UE; ++UI) {
 485       if (CallInst *CI = dyn_cast<CallInst>(*UI)) {
 486         // Find out which operand this is to the call instruction...
 487         User::op_iterator OI = find(CI->op_begin(), CI->op_end(), ScalarVal);
 488         assert(OI != CI->op_end() && "Call on use list but not an operand!?");
 489         assert(OI != CI->op_begin() && "Pointer operand is call destination?");
 490
 491         // FIXME: This is broken if the same pointer is passed to a call more
 492         // than once!  It will get multiple entries for the first pointer.
 493
 494         // Add the operand number and pool handle to the call table...
 495         addCallInfo(CallMap[CI], CI, OI-CI->op_begin()-1, Scalars[i].Node,
 496                     PoolDescriptors);
 497       }
 498     }
 499   }
 500
 501   // Print out call map...
 502   for (map<CallInst*, TransformFunctionInfo>::iterator I = CallMap.begin();
 503        I != CallMap.end(); ++I) {
 504     cerr << "\nFor call: ";
 505     I->first->dump();
 506     I->second.finalizeConstruction();
 507     cerr << I->second.Func->getName() << " must pass pool pointer for args #";
 508     for (unsigned i = 0; i < I->second.ArgInfo.size(); ++i)
 509       cerr << I->second.ArgInfo[i].ArgNo << ", ";
 510     cerr << "\n";
 511   }
 512
 513   // Loop through all of the call nodes, recursively creating the new functions
 514   // that we want to call...  This uses a map to prevent infinite recursion and
 515   // to avoid duplicating functions unneccesarily.
 516   //
 517   for (map<CallInst*, TransformFunctionInfo>::iterator I = CallMap.begin(),
 518          E = CallMap.end(); I != E; ++I) {
 519     // Make sure the entries are sorted.
 520     I->second.finalizeConstruction();
 521
 522     // Transform all of the functions we need, or at least ensure there is a
 523     // cached version available.
 524     transformFunction(I->second, IPFGraph);
 525   }
 526
 527   // Now that all of the functions that we want to call are available, transform
 528   // the local method so that it uses the pools locally and passes them to the
 529   // functions that we just hacked up.
 530   //
 531
 532   // First step, find the instructions to be modified.
 533   vector<Instruction*> InstToFix;
 534   for (unsigned i = 0, e = Scalars.size(); i != e; ++i) {
 535     Value *ScalarVal = Scalars[i].Val;
 536
 537     // Check to see if the scalar _IS_ an instruction.  If so, it is involved.
 538     if (Instruction *Inst = dyn_cast<Instruction>(ScalarVal))
 539       InstToFix.push_back(Inst);
 540
 541     // All all of the instructions that use the scalar as an operand...
 542     for (Value::use_iterator UI = ScalarVal->use_begin(),
 543            UE = ScalarVal->use_end(); UI != UE; ++UI)
 544       InstToFix.push_back(dyn_cast<Instruction>(*UI));
 545   }
 546
 547   // Eliminate duplicates by sorting, then removing equal neighbors.
 548   sort(InstToFix.begin(), InstToFix.end());
 549   InstToFix.erase(unique(InstToFix.begin(), InstToFix.end()), InstToFix.end());
 550
 551   // Use a FunctionBodyTransformer to transform all of the involved instructions
 552   FunctionBodyTransformer FBT(*this, Scalars, CallMap);
 553   for (unsigned i = 0, e = InstToFix.size(); i != e; ++i)
 554     FBT.visit(InstToFix[i]);
 555
 556
 557   // Since we have liberally hacked the function to pieces, we want to inform
 558   // the datastructure pass that its internal representation is out of date.
 559   //
 560   DS->invalidateFunction(F);
 561 }
 562
 563 static void addNodeMapping(DSNode *SrcNode, const PointerValSet &PVS,
 564                            map<DSNode*, PointerValSet> &NodeMapping) {
 565   for (unsigned i = 0, e = PVS.size(); i != e; ++i)
 566     if (NodeMapping[SrcNode].add(PVS[i])) {  // Not in map yet?
 567       assert(PVS[i].Index == 0 && "Node indexing not supported yet!");
 568       DSNode *DestNode = PVS[i].Node;
 569
 570       // Loop over all of the outgoing links in the mapped graph
 571       for (unsigned l = 0, le = DestNode->getNumOutgoingLinks(); l != le; ++l) {
 572         PointerValSet &SrcSet = SrcNode->getOutgoingLink(l);
 573         const PointerValSet &DestSet = DestNode->getOutgoingLink(l);
 574         assert((!SrcSet.empty() || DestSet.empty()) &&
 575                "Dest graph should be a proper subset of the src graph!");
 576
 577         // Add all of the node mappings now!
 578         for (unsigned si = 0, se = SrcSet.size(); si != se; ++si) {
 579           assert(SrcSet[si].Index == 0 && "Can't handle node offset!");
 580           addNodeMapping(SrcSet[si].Node, DestSet, NodeMapping);
 581         }
 582       }
 583     }
 584 }
 585
 586 // CalculateNodeMapping - There is a partial isomorphism between the graph
 587 // passed in and the graph that is actually used by the function.  We need to
 588 // figure out what this mapping is so that we can transformFunctionBody the
 589 // instructions in the function itself.  Note that every node in the graph that
 590 // we are interested in must be both in the local graph of the called function,
 591 // and in the local graph of the calling function.  Because of this, we only
 592 // define the mapping for these nodes [conveniently these are the only nodes we
 593 // CAN define a mapping for...]
 594 //
 595 // The roots of the graph that we are transforming is rooted in the arguments
 596 // passed into the function from the caller.  This is where we start our
 597 // mapping calculation.
 598 //
 599 // The NodeMapping calculated maps from the callers graph to the called graph.
 600 //
 601 static void CalculateNodeMapping(Function *F, TransformFunctionInfo &TFI,
 602                                  FunctionDSGraph &CallerGraph,
 603                                  FunctionDSGraph &CalledGraph,
 604                                  map<DSNode*, PointerValSet> &NodeMapping) {
 605   int LastArgNo = -2;
 606   for (unsigned i = 0, e = TFI.ArgInfo.size(); i != e; ++i) {
 607     // Figure out what nodes in the called graph the TFI.ArgInfo[i].Node node
 608     // corresponds to...
 609     //
 610     // Only consider first node of sequence.  Extra nodes may may be added
 611     // to the TFI if the data structure requires more nodes than just the
 612     // one the argument points to.  We are only interested in the one the
 613     // argument points to though.
 614     //
 615     if (TFI.ArgInfo[i].ArgNo != LastArgNo) {
 616       if (TFI.ArgInfo[i].ArgNo == -1) {
 617         addNodeMapping(TFI.ArgInfo[i].Node, CalledGraph.getRetNodes(),
 618                        NodeMapping);
 619       } else {
 620         // Figure out which node argument # ArgNo points to in the called graph.
 621         Value *Arg = F->getArgumentList()[TFI.ArgInfo[i].ArgNo];
 622         addNodeMapping(TFI.ArgInfo[i].Node, CalledGraph.getValueMap()[Arg],
 623                        NodeMapping);
 624       }
 625       LastArgNo = TFI.ArgInfo[i].ArgNo;
 626     }
 627   }
 628 }
 629
 630
 631 // transformFunction - Transform the specified function the specified way.  It
 632 // we have already transformed that function that way, don't do anything.  The
 633 // nodes in the TransformFunctionInfo come out of callers data structure graph.
 634 //
 635 void PoolAllocate::transformFunction(TransformFunctionInfo &TFI,
 636                                      FunctionDSGraph &CallerIPGraph) {
 637   if (getTransformedFunction(TFI)) return;  // Function xformation already done?
 638
 639   const FunctionType *OldFuncType = TFI.Func->getFunctionType();
 640
 641   assert(!OldFuncType->isVarArg() && "Vararg functions not handled yet!");
 642
 643   // Build the type for the new function that we are transforming
 644   vector<const Type*> ArgTys;
 645   for (unsigned i = 0, e = OldFuncType->getNumParams(); i != e; ++i)
 646     ArgTys.push_back(OldFuncType->getParamType(i));
 647
 648   // Add one pool pointer for every argument that needs to be supplemented.
 649   ArgTys.insert(ArgTys.end(), TFI.ArgInfo.size(), PoolTy);
 650
 651   // Build the new function type...
 652   const // FIXME when types are not const
 653   FunctionType *NewFuncType = FunctionType::get(OldFuncType->getReturnType(),
 654                                                 ArgTys,OldFuncType->isVarArg());
 655
 656   // The new function is internal, because we know that only we can call it.
 657   // This also helps subsequent IP transformations to eliminate duplicated pool
 658   // pointers. [in the future when they are implemented].
 659   //
 660   Function *NewFunc = new Function(NewFuncType, true,
 661                                    TFI.Func->getName()+".poolxform");
 662   CurModule->getFunctionList().push_back(NewFunc);
 663
 664   // Add the newly formed function to the TransformedFunctions table so that
 665   // infinite recursion does not occur!
 666   //
 667   TransformedFunctions[TFI] = NewFunc;
 668
 669   // Add arguments to the function... starting with all of the old arguments
 670   vector<Value*> ArgMap;
 671   for (unsigned i = 0, e = TFI.Func->getArgumentList().size(); i != e; ++i) {
 672     const FunctionArgument *OFA = TFI.Func->getArgumentList()[i];
 673     FunctionArgument *NFA = new FunctionArgument(OFA->getType(),OFA->getName());
 674     NewFunc->getArgumentList().push_back(NFA);
 675     ArgMap.push_back(NFA);  // Keep track of the arguments
 676   }
 677
 678   // Now add all of the arguments corresponding to pools passed in...
 679   for (unsigned i = 0, e = TFI.ArgInfo.size(); i != e; ++i) {
 680     string Name;
 681     if (TFI.ArgInfo[i].ArgNo == -1)
 682       Name = "retpool";
 683     else
 684       Name = ArgMap[TFI.ArgInfo[i].ArgNo]->getName();  // Get the arg name
 685     FunctionArgument *NFA = new FunctionArgument(PoolTy, Name+".pool");
 686     NewFunc->getArgumentList().push_back(NFA);
 687   }
 688
 689   // Now clone the body of the old function into the new function...
 690   CloneFunctionInto(NewFunc, TFI.Func, ArgMap);
 691
 692   // Okay, now we have a function that is identical to the old one, except that
 693   // it has extra arguments for the pools coming in.  Now we have to get the
 694   // data structure graph for the function we are replacing, and figure out how
 695   // our graph nodes map to the graph nodes in the dest function.
 696   //
 697   FunctionDSGraph &DSGraph = DS->getClosedDSGraph(NewFunc);
 698
 699   // NodeMapping - Multimap from callers graph to called graph.
 700   //
 701   map<DSNode*, PointerValSet> NodeMapping;
 702
 703   CalculateNodeMapping(NewFunc, TFI, CallerIPGraph, DSGraph,
 704                        NodeMapping);
 705
 706   // Print out the node mapping...
 707   cerr << "\nNode mapping for call of " << NewFunc->getName() << "\n";
 708   for (map<DSNode*, PointerValSet>::iterator I = NodeMapping.begin();
 709        I != NodeMapping.end(); ++I) {
 710     cerr << "Map: "; I->first->print(cerr);
 711     cerr << "To:  "; I->second.print(cerr);
 712     cerr << "\n";
 713   }
 714
 715   // Fill in the PoolDescriptor information for the transformed function so that
 716   // it can determine which value holds the pool descriptor for each data
 717   // structure node that it accesses.
 718   //
 719   map<DSNode*, Value*> PoolDescriptors;
 720
 721   cerr << "\nCalculating the pool descriptor map:\n";
 722
 723   // All of the pool descriptors must be passed in as arguments...
 724   for (unsigned i = 0, e = TFI.ArgInfo.size(); i != e; ++i) {
 725     DSNode *CallerNode = TFI.ArgInfo[i].Node;
 726     Value  *CallerPool = TFI.ArgInfo[i].PoolHandle;
 727
 728     cerr << "Mapped caller node: "; CallerNode->print(cerr);
 729     cerr << "Mapped caller pool: "; CallerPool->dump();
 730
 731     // Calculate the argument number that the pool is to the function call...
 732     // The call instruction should not have the pool operands added yet.
 733     unsigned ArgNo = TFI.Call->getNumOperands()-1+i;
 734     cerr << "Should be argument #: " << ArgNo << "[i = " << i << "]\n";
 735     assert(ArgNo < NewFunc->getArgumentList().size() &&
 736            "Call already has pool arguments added??");
 737
 738     // Map the pool argument into the called function...
 739     Value *CalleePool = NewFunc->getArgumentList()[ArgNo];
 740
 741     // Map the DSNode into the callee's DSGraph
 742     const PointerValSet &CalleeNodes = NodeMapping[CallerNode];
 743     for (unsigned n = 0, ne = CalleeNodes.size(); n != ne; ++n) {
 744       assert(CalleeNodes[n].Index == 0 && "Indexed node not handled yet!");
 745       DSNode *CalleeNode = CalleeNodes[n].Node;
 746
 747       cerr << "*** to callee node: "; CalleeNode->print(cerr);
 748       cerr << "*** to callee pool: "; CalleePool->dump();
 749       cerr << "\n";
 750
 751       assert(CalleeNode && CalleePool && "Invalid nodes!");
 752       Value *&PV = PoolDescriptors[CalleeNode];
 753       //assert((PV == 0 || PV == CalleePool) && "Invalid node remapping!");
 754       PV = CalleePool;         // Update the pool descriptor map!
 755     }
 756   }
 757
 758   // We must destroy the node mapping so that we don't have latent references
 759   // into the data structure graph for the new function.  Otherwise we get
 760   // assertion failures when transformFunctionBody tries to invalidate the
 761   // graph.
 762   //
 763   NodeMapping.clear();
 764
 765   // Now that we know everything we need about the function, transform the body
 766   // now!
 767   //
 768   transformFunctionBody(NewFunc, DSGraph, PoolDescriptors);
 769
 770   cerr << "Function after transformation:\n";
 771   NewFunc->dump();
 772 }
 773
 774
 775 // CreatePools - Insert instructions into the function we are processing to
 776 // create all of the memory pool objects themselves.  This also inserts
 777 // destruction code.  Add an alloca for each pool that is allocated to the
 778 // PoolDescriptors vector.
 779 //
 780 void PoolAllocate::CreatePools(Function *F, const vector<AllocDSNode*> &Allocs,
 781                                map<DSNode*, Value*> &PoolDescriptors) {
 782   // FIXME: This should use an IP version of the UnifyAllExits pass!
 783   vector<BasicBlock*> ReturnNodes;
 784   for (Function::iterator I = F->begin(), E = F->end(); I != E; ++I)
 785     if (isa<ReturnInst>((*I)->getTerminator()))
 786       ReturnNodes.push_back(*I);
 787
 788
 789   // Create the code that goes in the entry and exit nodes for the method...
 790   vector<Instruction*> EntryNodeInsts;
 791   for (unsigned i = 0, e = Allocs.size(); i != e; ++i) {
 792     // Add an allocation and a free for each pool...
 793     AllocaInst *PoolAlloc = new AllocaInst(PoolTy, 0, "pool");
 794     EntryNodeInsts.push_back(PoolAlloc);
 795     PoolDescriptors[Allocs[i]] = PoolAlloc;   // Keep track of pool allocas
 796     AllocationInst *AI = Allocs[i]->getAllocation();
 797
 798     // Initialize the pool.  We need to know how big each allocation is.  For
 799     // our purposes here, we assume we are allocating a scalar, or array of
 800     // constant size.
 801     //
 802     unsigned ElSize = TargetData.getTypeSize(AI->getAllocatedType());
 803     ElSize *= cast<ConstantUInt>(AI->getArraySize())->getValue();
 804
 805     vector<Value*> Args;
 806     Args.push_back(PoolAlloc);    // Pool to initialize
 807     Args.push_back(ConstantUInt::get(Type::UIntTy, ElSize));
 808     EntryNodeInsts.push_back(new CallInst(PoolInit, Args));
 809
 810     // Destroy the pool...
 811     Args.pop_back();
 812
 813     for (unsigned EN = 0, ENE = ReturnNodes.size(); EN != ENE; ++EN) {
 814       Instruction *Destroy = new CallInst(PoolDestroy, Args);
 815
 816       // Insert it before the return instruction...
 817       BasicBlock *RetNode = ReturnNodes[EN];
 818       RetNode->getInstList().insert(RetNode->end()-1, Destroy);
 819     }
 820   }
 821
 822   // Insert the entry node code into the entry block...
 823   F->getEntryNode()->getInstList().insert(F->getEntryNode()->begin()+1,
 824                                           EntryNodeInsts.begin(),
 825                                           EntryNodeInsts.end());
 826 }
 827
 828
 829 // addPoolPrototypes - Add prototypes for the pool methods to the specified
 830 // module and update the Pool* instance variables to point to them.
 831 //
 832 void PoolAllocate::addPoolPrototypes(Module *M) {
 833   // Get PoolInit function...
 834   vector<const Type*> Args;
 835   Args.push_back(PoolTy);           // Pool to initialize
 836   Args.push_back(Type::UIntTy);     // Num bytes per element
 837   FunctionType *PoolInitTy = FunctionType::get(Type::VoidTy, Args, false);
 838   PoolInit = M->getOrInsertFunction("poolinit", PoolInitTy);
 839
 840   // Get pooldestroy function...
 841   Args.pop_back();  // Only takes a pool...
 842   FunctionType *PoolDestroyTy = FunctionType::get(Type::VoidTy, Args, false);
 843   PoolDestroy = M->getOrInsertFunction("pooldestroy", PoolDestroyTy);
 844
 845   const Type *PtrVoid = PointerType::get(Type::SByteTy);
 846
 847   // Get the poolalloc function...
 848   FunctionType *PoolAllocTy = FunctionType::get(PtrVoid, Args, false);
 849   PoolAlloc = M->getOrInsertFunction("poolalloc", PoolAllocTy);
 850
 851   // Get the poolfree function...
 852   Args.push_back(PtrVoid);
 853   FunctionType *PoolFreeTy = FunctionType::get(Type::VoidTy, Args, false);
 854   PoolFree = M->getOrInsertFunction("poolfree", PoolFreeTy);
 855
 856   // Add the %PoolTy type to the symbol table of the module...
 857   M->addTypeName("PoolTy", PoolTy->getElementType());
 858 }
 859
 860
 861 bool PoolAllocate::run(Module *M) {
 862   addPoolPrototypes(M);
 863   CurModule = M;
 864
 865   DS = &getAnalysis<DataStructure>();
 866   bool Changed = false;
 867
 868   // We cannot use an iterator here because it will get invalidated when we add
 869   // functions to the module later...
 870   for (unsigned i = 0; i != M->size(); ++i)
 871     if (!M->getFunctionList()[i]->isExternal()) {
 872       Changed |= processFunction(M->getFunctionList()[i]);
 873       if (Changed) {
 874         cerr << "Only processing one function\n";
 875         break;
 876       }
 877     }
 878
 879   CurModule = 0;
 880   DS = 0;
 881   return false;
 882 }
 883
 884
 885 // createPoolAllocatePass - Global function to access the functionality of this
 886 // pass...
 887 //
 888 Pass *createPoolAllocatePass() { return new PoolAllocate(); }