Change encoding of instruction operands in bitcode binaries to be relative

[oota-llvm.git] / lib / Bitcode / Writer / BitcodeWriter.cpp
diff --git a/lib/Bitcode/Writer/BitcodeWriter.cpp b/lib/Bitcode/Writer/BitcodeWriter.cpp

index 48f60bc3c57c983f8626bef55df74972a9a8d5ad..efa60b8e0763c714af6cf480d8b882e56b114153 100644 (file)
--- a/lib/Bitcode/Writer/BitcodeWriter.cpp
+++ b/lib/Bitcode/Writer/BitcodeWriter.cpp
@@ -41,8 +41,6 @@ EnablePreserveUseListOrdering("enable-bc-uselist-preserve",
  /// These are manifest constants used by the bitcode writer. They do not need to
  /// be kept in sync with the reader, but need to be consistent within this file.
  enum {
-  CurVersion = 0,
-
    // VALUE_SYMTAB_BLOCK abbrev id's.
    VST_ENTRY_8_ABBREV = bitc::FIRST_APPLICATION_ABBREV,
    VST_ENTRY_7_ABBREV,
@@ -62,7 +60,10 @@ enum {
    FUNCTION_INST_CAST_ABBREV,
    FUNCTION_INST_RET_VOID_ABBREV,
    FUNCTION_INST_RET_VAL_ABBREV,
-  FUNCTION_INST_UNREACHABLE_ABBREV
+  FUNCTION_INST_UNREACHABLE_ABBREV,
+  
+  // SwitchInst Magic
+  SWITCH_INST_MAGIC = 0x4B5 // May 2012 => 1205 => Hex
  };
  
  static unsigned GetEncodedCastOpcode(unsigned Opcode) {
@@ -126,7 +127,6 @@ static unsigned GetEncodedRMWOperation(AtomicRMWInst::BinOp Op) {
  
  static unsigned GetEncodedOrdering(AtomicOrdering Ordering) {
    switch (Ordering) {
-  default: llvm_unreachable("Unknown atomic ordering");
    case NotAtomic: return bitc::ORDERING_NOTATOMIC;
    case Unordered: return bitc::ORDERING_UNORDERED;
    case Monotonic: return bitc::ORDERING_MONOTONIC;
@@ -135,14 +135,15 @@ static unsigned GetEncodedOrdering(AtomicOrdering Ordering) {
    case AcquireRelease: return bitc::ORDERING_ACQREL;
    case SequentiallyConsistent: return bitc::ORDERING_SEQCST;
    }
+  llvm_unreachable("Invalid ordering");
  }
  
  static unsigned GetEncodedSynchScope(SynchronizationScope SynchScope) {
    switch (SynchScope) {
-  default: llvm_unreachable("Unknown synchronization scope");
    case SingleThread: return bitc::SYNCHSCOPE_SINGLETHREAD;
    case CrossThread: return bitc::SYNCHSCOPE_CROSSTHREAD;
    }
+  llvm_unreachable("Invalid synch scope");
  }
  
  static void WriteStringRecord(unsigned Code, StringRef Str,
@@ -174,17 +175,7 @@ static void WriteAttributeTable(const ValueEnumerator &VE,
      for (unsigned i = 0, e = A.getNumSlots(); i != e; ++i) {
        const AttributeWithIndex &PAWI = A.getSlot(i);
        Record.push_back(PAWI.Index);
-
-      // FIXME: remove in LLVM 3.0
-      // Store the alignment in the bitcode as a 16-bit raw value instead of a
-      // 5-bit log2 encoded value. Shift the bits above the alignment up by
-      // 11 bits.
-      uint64_t FauxAttr = PAWI.Attrs & 0xffff;
-      if (PAWI.Attrs & Attribute::Alignment)
-        FauxAttr |= (1ull<<16)<<(((PAWI.Attrs & Attribute::Alignment)-1) >> 16);
-      FauxAttr |= (PAWI.Attrs & (0x3FFull << 21)) << 11;
-
-      Record.push_back(FauxAttr);
+      Record.push_back(Attributes::encodeLLVMAttributesForBitcode(PAWI.Attrs));
      }
  
      Stream.EmitRecord(bitc::PARAMATTR_CODE_ENTRY, Record);
@@ -201,11 +192,12 @@ static void WriteTypeTable(const ValueEnumerator &VE, BitstreamWriter &Stream) {
    Stream.EnterSubblock(bitc::TYPE_BLOCK_ID_NEW, 4 /*count from # abbrevs */);
    SmallVector<uint64_t, 64> TypeVals;
  
+  uint64_t NumBits = Log2_32_Ceil(VE.getTypes().size()+1);
+
    // Abbrev for TYPE_CODE_POINTER.
    BitCodeAbbrev *Abbv = new BitCodeAbbrev();
    Abbv->Add(BitCodeAbbrevOp(bitc::TYPE_CODE_POINTER));
-  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed,
-                            Log2_32_Ceil(VE.getTypes().size()+1)));
+  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, NumBits));
    Abbv->Add(BitCodeAbbrevOp(0));  // Addrspace = 0
    unsigned PtrAbbrev = Stream.EmitAbbrev(Abbv);
  
@@ -214,8 +206,8 @@ static void WriteTypeTable(const ValueEnumerator &VE, BitstreamWriter &Stream) {
    Abbv->Add(BitCodeAbbrevOp(bitc::TYPE_CODE_FUNCTION));
    Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, 1));  // isvararg
    Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Array));
-  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed,
-                            Log2_32_Ceil(VE.getTypes().size()+1)));
+  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, NumBits));
+
    unsigned FunctionAbbrev = Stream.EmitAbbrev(Abbv);
  
    // Abbrev for TYPE_CODE_STRUCT_ANON.
@@ -223,8 +215,8 @@ static void WriteTypeTable(const ValueEnumerator &VE, BitstreamWriter &Stream) {
    Abbv->Add(BitCodeAbbrevOp(bitc::TYPE_CODE_STRUCT_ANON));
    Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, 1));  // ispacked
    Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Array));
-  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed,
-                            Log2_32_Ceil(VE.getTypes().size()+1)));
+  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, NumBits));
+
    unsigned StructAnonAbbrev = Stream.EmitAbbrev(Abbv);
  
    // Abbrev for TYPE_CODE_STRUCT_NAME.
@@ -239,16 +231,16 @@ static void WriteTypeTable(const ValueEnumerator &VE, BitstreamWriter &Stream) {
    Abbv->Add(BitCodeAbbrevOp(bitc::TYPE_CODE_STRUCT_NAMED));
    Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, 1));  // ispacked
    Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Array));
-  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed,
-                            Log2_32_Ceil(VE.getTypes().size()+1)));
+  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, NumBits));
+
    unsigned StructNamedAbbrev = Stream.EmitAbbrev(Abbv);
    
    // Abbrev for TYPE_CODE_ARRAY.
    Abbv = new BitCodeAbbrev();
    Abbv->Add(BitCodeAbbrevOp(bitc::TYPE_CODE_ARRAY));
    Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::VBR, 8));   // size
-  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed,
-                            Log2_32_Ceil(VE.getTypes().size()+1)));
+  Abbv->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, NumBits));
+
    unsigned ArrayAbbrev = Stream.EmitAbbrev(Abbv);
  
    // Emit an entry count so the reader can reserve space.
@@ -265,6 +257,7 @@ static void WriteTypeTable(const ValueEnumerator &VE, BitstreamWriter &Stream) {
      switch (T->getTypeID()) {
      default: llvm_unreachable("Unknown type!");
      case Type::VoidTyID:      Code = bitc::TYPE_CODE_VOID;   break;
+    case Type::HalfTyID:      Code = bitc::TYPE_CODE_HALF;   break;
      case Type::FloatTyID:     Code = bitc::TYPE_CODE_FLOAT;  break;
      case Type::DoubleTyID:    Code = bitc::TYPE_CODE_DOUBLE; break;
      case Type::X86_FP80TyID:  Code = bitc::TYPE_CODE_X86_FP80; break;
@@ -355,7 +348,6 @@ static void WriteTypeTable(const ValueEnumerator &VE, BitstreamWriter &Stream) {
  
  static unsigned getEncodedLinkage(const GlobalValue *GV) {
    switch (GV->getLinkage()) {
-  default: llvm_unreachable("Invalid linkage!");
    case GlobalValue::ExternalLinkage:                 return 0;
    case GlobalValue::WeakAnyLinkage:                  return 1;
    case GlobalValue::AppendingLinkage:                return 2;
@@ -371,17 +363,29 @@ static unsigned getEncodedLinkage(const GlobalValue *GV) {
    case GlobalValue::AvailableExternallyLinkage:      return 12;
    case GlobalValue::LinkerPrivateLinkage:            return 13;
    case GlobalValue::LinkerPrivateWeakLinkage:        return 14;
-  case GlobalValue::LinkerPrivateWeakDefAutoLinkage: return 15;
+  case GlobalValue::LinkOnceODRAutoHideLinkage:      return 15;
    }
+  llvm_unreachable("Invalid linkage");
  }
  
  static unsigned getEncodedVisibility(const GlobalValue *GV) {
    switch (GV->getVisibility()) {
-  default: llvm_unreachable("Invalid visibility!");
    case GlobalValue::DefaultVisibility:   return 0;
    case GlobalValue::HiddenVisibility:    return 1;
    case GlobalValue::ProtectedVisibility: return 2;
    }
+  llvm_unreachable("Invalid visibility");
+}
+
+static unsigned getEncodedThreadLocalMode(const GlobalVariable *GV) {
+  switch (GV->getThreadLocalMode()) {
+    case GlobalVariable::NotThreadLocal:         return 0;
+    case GlobalVariable::GeneralDynamicTLSModel: return 1;
+    case GlobalVariable::LocalDynamicTLSModel:   return 2;
+    case GlobalVariable::InitialExecTLSModel:    return 3;
+    case GlobalVariable::LocalExecTLSModel:      return 4;
+  }
+  llvm_unreachable("Invalid TLS model");
  }
  
  // Emit top-level description of module, including target triple, inline asm,
@@ -492,7 +496,7 @@ static void WriteModuleInfo(const Module *M, const ValueEnumerator &VE,
          GV->getVisibility() != GlobalValue::DefaultVisibility ||
          GV->hasUnnamedAddr()) {
        Vals.push_back(getEncodedVisibility(GV));
-      Vals.push_back(GV->isThreadLocal());
+      Vals.push_back(getEncodedThreadLocalMode(GV));
        Vals.push_back(GV->hasUnnamedAddr());
      } else {
        AbbrevToUse = SimpleGVarAbbrev;
@@ -504,8 +508,8 @@ static void WriteModuleInfo(const Module *M, const ValueEnumerator &VE,
  
    // Emit the function proto information.
    for (Module::const_iterator F = M->begin(), E = M->end(); F != E; ++F) {
-    // FUNCTION:  [type, callingconv, isproto, paramattr,
-    //             linkage, alignment, section, visibility, gc, unnamed_addr]
+    // FUNCTION:  [type, callingconv, isproto, linkage, paramattrs, alignment,
+    //             section, visibility, gc, unnamed_addr]
      Vals.push_back(VE.getTypeID(F->getType()));
      Vals.push_back(F->getCallingConv());
      Vals.push_back(F->isDeclaration());
@@ -525,6 +529,7 @@ static void WriteModuleInfo(const Module *M, const ValueEnumerator &VE,
    // Emit the alias information.
    for (Module::const_alias_iterator AI = M->alias_begin(), E = M->alias_end();
         AI != E; ++AI) {
+    // ALIAS: [alias type, aliasee val#, linkage, visibility]
      Vals.push_back(VE.getTypeID(AI->getType()));
      Vals.push_back(VE.getValueID(AI->getAliasee()));
      Vals.push_back(getEncodedLinkage(AI));
@@ -715,6 +720,41 @@ static void WriteModuleMetadataStore(const Module *M, BitstreamWriter &Stream) {
    Stream.ExitBlock();
  }
  
+static void emitSignedInt64(SmallVectorImpl<uint64_t> &Vals, uint64_t V) {
+  if ((int64_t)V >= 0)
+    Vals.push_back(V << 1);
+  else
+    Vals.push_back((-V << 1) | 1);
+}
+
+static void EmitAPInt(SmallVectorImpl<uint64_t> &Vals,
+                      unsigned &Code, unsigned &AbbrevToUse, const APInt &Val,
+                      bool EmitSizeForWideNumbers = false
+                      ) {
+  if (Val.getBitWidth() <= 64) {
+    uint64_t V = Val.getSExtValue();
+    emitSignedInt64(Vals, V);
+    Code = bitc::CST_CODE_INTEGER;
+    AbbrevToUse = CONSTANTS_INTEGER_ABBREV;
+  } else {
+    // Wide integers, > 64 bits in size.
+    // We have an arbitrary precision integer value to write whose
+    // bit width is > 64. However, in canonical unsigned integer
+    // format it is likely that the high bits are going to be zero.
+    // So, we only write the number of active words.
+    unsigned NWords = Val.getActiveWords();
+    
+    if (EmitSizeForWideNumbers)
+      Vals.push_back(NWords);
+    
+    const uint64_t *RawWords = Val.getRawData();
+    for (unsigned i = 0; i != NWords; ++i) {
+      emitSignedInt64(Vals, RawWords[i]);
+    }
+    Code = bitc::CST_CODE_WIDE_INTEGER;
+  }
+}
+
  static void WriteConstants(unsigned FirstVal, unsigned LastVal,
                             const ValueEnumerator &VE,
                             BitstreamWriter &Stream, bool isGlobal) {
@@ -772,7 +812,8 @@ static void WriteConstants(unsigned FirstVal, unsigned LastVal,
  
      if (const InlineAsm *IA = dyn_cast<InlineAsm>(V)) {
        Record.push_back(unsigned(IA->hasSideEffects()) |
-                       unsigned(IA->isAlignStack()) << 1);
+                       unsigned(IA->isAlignStack()) << 1 |
+                       unsigned(IA->getDialect()&1) << 2);
  
        // Add the asm string.
        const std::string &AsmStr = IA->getAsmString();
@@ -797,34 +838,11 @@ static void WriteConstants(unsigned FirstVal, unsigned LastVal,
      } else if (isa<UndefValue>(C)) {
        Code = bitc::CST_CODE_UNDEF;
      } else if (const ConstantInt *IV = dyn_cast<ConstantInt>(C)) {
-      if (IV->getBitWidth() <= 64) {
-        uint64_t V = IV->getSExtValue();
-        if ((int64_t)V >= 0)
-          Record.push_back(V << 1);
-        else
-          Record.push_back((-V << 1) | 1);
-        Code = bitc::CST_CODE_INTEGER;
-        AbbrevToUse = CONSTANTS_INTEGER_ABBREV;
-      } else {                             // Wide integers, > 64 bits in size.
-        // We have an arbitrary precision integer value to write whose
-        // bit width is > 64. However, in canonical unsigned integer
-        // format it is likely that the high bits are going to be zero.
-        // So, we only write the number of active words.
-        unsigned NWords = IV->getValue().getActiveWords();
-        const uint64_t *RawWords = IV->getValue().getRawData();
-        for (unsigned i = 0; i != NWords; ++i) {
-          int64_t V = RawWords[i];
-          if (V >= 0)
-            Record.push_back(V << 1);
-          else
-            Record.push_back((-V << 1) | 1);
-        }
-        Code = bitc::CST_CODE_WIDE_INTEGER;
-      }
+      EmitAPInt(Record, Code, AbbrevToUse, IV->getValue());
      } else if (const ConstantFP *CFP = dyn_cast<ConstantFP>(C)) {
        Code = bitc::CST_CODE_FLOAT;
        Type *Ty = CFP->getType();
-      if (Ty->isFloatTy() || Ty->isDoubleTy()) {
+      if (Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy()) {
          Record.push_back(CFP->getValueAPF().bitcastToAPInt().getZExtValue());
        } else if (Ty->isX86_FP80Ty()) {
          // api needed to prevent premature destruction
@@ -841,34 +859,56 @@ static void WriteConstants(unsigned FirstVal, unsigned LastVal,
        } else {
          assert (0 && "Unknown FP type!");
        }
-    } else if (isa<ConstantArray>(C) && cast<ConstantArray>(C)->isString()) {
-      const ConstantArray *CA = cast<ConstantArray>(C);
+    } else if (isa<ConstantDataSequential>(C) &&
+               cast<ConstantDataSequential>(C)->isString()) {
+      const ConstantDataSequential *Str = cast<ConstantDataSequential>(C);
        // Emit constant strings specially.
-      unsigned NumOps = CA->getNumOperands();
+      unsigned NumElts = Str->getNumElements();
        // If this is a null-terminated string, use the denser CSTRING encoding.
-      if (CA->getOperand(NumOps-1)->isNullValue()) {
+      if (Str->isCString()) {
          Code = bitc::CST_CODE_CSTRING;
-        --NumOps;  // Don't encode the null, which isn't allowed by char6.
+        --NumElts;  // Don't encode the null, which isn't allowed by char6.
        } else {
          Code = bitc::CST_CODE_STRING;
          AbbrevToUse = String8Abbrev;
        }
        bool isCStr7 = Code == bitc::CST_CODE_CSTRING;
        bool isCStrChar6 = Code == bitc::CST_CODE_CSTRING;
-      for (unsigned i = 0; i != NumOps; ++i) {
-        unsigned char V = cast<ConstantInt>(CA->getOperand(i))->getZExtValue();
+      for (unsigned i = 0; i != NumElts; ++i) {
+        unsigned char V = Str->getElementAsInteger(i);
          Record.push_back(V);
          isCStr7 &= (V & 128) == 0;
          if (isCStrChar6)
            isCStrChar6 = BitCodeAbbrevOp::isChar6(V);
        }
-
+      
        if (isCStrChar6)
          AbbrevToUse = CString6Abbrev;
        else if (isCStr7)
          AbbrevToUse = CString7Abbrev;
-    } else if (isa<ConstantArray>(C) || isa<ConstantStruct>(V) ||
-               isa<ConstantVector>(V)) {
+    } else if (const ConstantDataSequential *CDS = 
+                  dyn_cast<ConstantDataSequential>(C)) {
+      Code = bitc::CST_CODE_DATA;
+      Type *EltTy = CDS->getType()->getElementType();
+      if (isa<IntegerType>(EltTy)) {
+        for (unsigned i = 0, e = CDS->getNumElements(); i != e; ++i)
+          Record.push_back(CDS->getElementAsInteger(i));
+      } else if (EltTy->isFloatTy()) {
+        for (unsigned i = 0, e = CDS->getNumElements(); i != e; ++i) {
+          union { float F; uint32_t I; };
+          F = CDS->getElementAsFloat(i);
+          Record.push_back(I);
+        }
+      } else {
+        assert(EltTy->isDoubleTy() && "Unknown ConstantData element type");
+        for (unsigned i = 0, e = CDS->getNumElements(); i != e; ++i) {
+          union { double F; uint64_t I; };
+          F = CDS->getElementAsDouble(i);
+          Record.push_back(I);
+        }
+      }
+    } else if (isa<ConstantArray>(C) || isa<ConstantStruct>(C) ||
+               isa<ConstantVector>(C)) {
        Code = bitc::CST_CODE_AGGREGATE;
        for (unsigned i = 0, e = C->getNumOperands(); i != e; ++i)
          Record.push_back(VE.getValueID(C->getOperand(i)));
@@ -983,12 +1023,13 @@ static void WriteModuleConstants(const ValueEnumerator &VE,
  ///
  /// This function adds V's value ID to Vals.  If the value ID is higher than the
  /// instruction ID, then it is a forward reference, and it also includes the
-/// type ID.
+/// type ID.  The value ID that is written is encoded relative to the InstID.
  static bool PushValueAndType(const Value *V, unsigned InstID,
                               SmallVector<unsigned, 64> &Vals,
                               ValueEnumerator &VE) {
    unsigned ValID = VE.getValueID(V);
-  Vals.push_back(ValID);
+  // Make encoding relative to the InstID.
+  Vals.push_back(InstID - ValID);
    if (ValID >= InstID) {
      Vals.push_back(VE.getTypeID(V->getType()));
      return true;
@@ -996,6 +1037,30 @@ static bool PushValueAndType(const Value *V, unsigned InstID,
    return false;
  }
  
+/// pushValue - Like PushValueAndType, but where the type of the value is
+/// omitted (perhaps it was already encoded in an earlier operand).
+static void pushValue(const Value *V, unsigned InstID,
+                      SmallVector<unsigned, 64> &Vals,
+                      ValueEnumerator &VE) {
+  unsigned ValID = VE.getValueID(V);
+  Vals.push_back(InstID - ValID);
+}
+
+static void pushValue64(const Value *V, unsigned InstID,
+                        SmallVector<uint64_t, 128> &Vals,
+                        ValueEnumerator &VE) {
+  uint64_t ValID = VE.getValueID(V);
+  Vals.push_back(InstID - ValID);
+}
+
+static void pushValueSigned(const Value *V, unsigned InstID,
+                            SmallVector<uint64_t, 128> &Vals,
+                            ValueEnumerator &VE) {
+  unsigned ValID = VE.getValueID(V);
+  int64_t diff = ((int32_t)InstID - (int32_t)ValID);
+  emitSignedInt64(Vals, diff);
+}
+
  /// WriteInstruction - Emit an instruction to the specified stream.
  static void WriteInstruction(const Instruction &I, unsigned InstID,
                               ValueEnumerator &VE, BitstreamWriter &Stream,
@@ -1016,7 +1081,7 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
        Code = bitc::FUNC_CODE_INST_BINOP;
        if (!PushValueAndType(I.getOperand(0), InstID, Vals, VE))
          AbbrevToUse = FUNCTION_INST_BINOP_ABBREV;
-      Vals.push_back(VE.getValueID(I.getOperand(1)));
+      pushValue(I.getOperand(1), InstID, Vals, VE);
        Vals.push_back(GetEncodedBinaryOpcode(I.getOpcode()));
        uint64_t Flags = GetOptimizationFlags(&I);
        if (Flags != 0) {
@@ -1054,32 +1119,32 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
    case Instruction::Select:
      Code = bitc::FUNC_CODE_INST_VSELECT;
      PushValueAndType(I.getOperand(1), InstID, Vals, VE);
-    Vals.push_back(VE.getValueID(I.getOperand(2)));
+    pushValue(I.getOperand(2), InstID, Vals, VE);
      PushValueAndType(I.getOperand(0), InstID, Vals, VE);
      break;
    case Instruction::ExtractElement:
      Code = bitc::FUNC_CODE_INST_EXTRACTELT;
      PushValueAndType(I.getOperand(0), InstID, Vals, VE);
-    Vals.push_back(VE.getValueID(I.getOperand(1)));
+    pushValue(I.getOperand(1), InstID, Vals, VE);
      break;
    case Instruction::InsertElement:
      Code = bitc::FUNC_CODE_INST_INSERTELT;
      PushValueAndType(I.getOperand(0), InstID, Vals, VE);
-    Vals.push_back(VE.getValueID(I.getOperand(1)));
-    Vals.push_back(VE.getValueID(I.getOperand(2)));
+    pushValue(I.getOperand(1), InstID, Vals, VE);
+    pushValue(I.getOperand(2), InstID, Vals, VE);
      break;
    case Instruction::ShuffleVector:
      Code = bitc::FUNC_CODE_INST_SHUFFLEVEC;
      PushValueAndType(I.getOperand(0), InstID, Vals, VE);
-    Vals.push_back(VE.getValueID(I.getOperand(1)));
-    Vals.push_back(VE.getValueID(I.getOperand(2)));
+    pushValue(I.getOperand(1), InstID, Vals, VE);
+    pushValue(I.getOperand(2), InstID, Vals, VE);
      break;
    case Instruction::ICmp:
    case Instruction::FCmp:
      // compare returning Int1Ty or vector of Int1Ty
      Code = bitc::FUNC_CODE_INST_CMP2;
      PushValueAndType(I.getOperand(0), InstID, Vals, VE);
-    Vals.push_back(VE.getValueID(I.getOperand(1)));
+    pushValue(I.getOperand(1), InstID, Vals, VE);
      Vals.push_back(cast<CmpInst>(I).getPredicate());
      break;
  
@@ -1105,20 +1170,77 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
        Vals.push_back(VE.getValueID(II.getSuccessor(0)));
        if (II.isConditional()) {
          Vals.push_back(VE.getValueID(II.getSuccessor(1)));
-        Vals.push_back(VE.getValueID(II.getCondition()));
+        pushValue(II.getCondition(), InstID, Vals, VE);
        }
      }
      break;
    case Instruction::Switch:
-    Code = bitc::FUNC_CODE_INST_SWITCH;
-    Vals.push_back(VE.getTypeID(I.getOperand(0)->getType()));
-    for (unsigned i = 0, e = I.getNumOperands(); i != e; ++i)
-      Vals.push_back(VE.getValueID(I.getOperand(i)));
+    {
+      // Redefine Vals, since here we need to use 64 bit values
+      // explicitly to store large APInt numbers.
+      SmallVector<uint64_t, 128> Vals64;
+      
+      Code = bitc::FUNC_CODE_INST_SWITCH;
+      SwitchInst &SI = cast<SwitchInst>(I);
+      
+      uint32_t SwitchRecordHeader = SI.hash() | (SWITCH_INST_MAGIC << 16); 
+      Vals64.push_back(SwitchRecordHeader);      
+      
+      Vals64.push_back(VE.getTypeID(SI.getCondition()->getType()));
+      pushValue64(SI.getCondition(), InstID, Vals64, VE);
+      Vals64.push_back(VE.getValueID(SI.getDefaultDest()));
+      Vals64.push_back(SI.getNumCases());
+      for (SwitchInst::CaseIt i = SI.case_begin(), e = SI.case_end();
+           i != e; ++i) {
+        IntegersSubset& CaseRanges = i.getCaseValueEx();
+        unsigned Code, Abbrev; // will unused.
+        
+        if (CaseRanges.isSingleNumber()) {
+          Vals64.push_back(1/*NumItems = 1*/);
+          Vals64.push_back(true/*IsSingleNumber = true*/);
+          EmitAPInt(Vals64, Code, Abbrev, CaseRanges.getSingleNumber(0), true);
+        } else {
+          
+          Vals64.push_back(CaseRanges.getNumItems());
+          
+          if (CaseRanges.isSingleNumbersOnly()) {
+            for (unsigned ri = 0, rn = CaseRanges.getNumItems();
+                 ri != rn; ++ri) {
+              
+              Vals64.push_back(true/*IsSingleNumber = true*/);
+              
+              EmitAPInt(Vals64, Code, Abbrev,
+                        CaseRanges.getSingleNumber(ri), true);
+            }
+          } else
+            for (unsigned ri = 0, rn = CaseRanges.getNumItems();
+                 ri != rn; ++ri) {
+              IntegersSubset::Range r = CaseRanges.getItem(ri);
+              bool IsSingleNumber = CaseRanges.isSingleNumber(ri);
+    
+              Vals64.push_back(IsSingleNumber);
+              
+              EmitAPInt(Vals64, Code, Abbrev, r.getLow(), true);
+              if (!IsSingleNumber)
+                EmitAPInt(Vals64, Code, Abbrev, r.getHigh(), true);
+            }
+        }
+        Vals64.push_back(VE.getValueID(i.getCaseSuccessor()));
+      }
+      
+      Stream.EmitRecord(Code, Vals64, AbbrevToUse);
+      
+      // Also do expected action - clear external Vals collection:
+      Vals.clear();
+      return;
+    }
      break;
    case Instruction::IndirectBr:
      Code = bitc::FUNC_CODE_INST_INDIRECTBR;
      Vals.push_back(VE.getTypeID(I.getOperand(0)->getType()));
-    for (unsigned i = 0, e = I.getNumOperands(); i != e; ++i)
+    // Encode the address operand as relative, but not the basic blocks.
+    pushValue(I.getOperand(0), InstID, Vals, VE);
+    for (unsigned i = 1, e = I.getNumOperands(); i != e; ++i)
        Vals.push_back(VE.getValueID(I.getOperand(i)));
      break;
        
@@ -1137,7 +1259,7 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
  
      // Emit value #'s for the fixed parameters.
      for (unsigned i = 0, e = FTy->getNumParams(); i != e; ++i)
-      Vals.push_back(VE.getValueID(I.getOperand(i)));  // fixed param.
+      pushValue(I.getOperand(i), InstID, Vals, VE);  // fixed param.
  
      // Emit type/value pairs for varargs params.
      if (FTy->isVarArg()) {
@@ -1151,9 +1273,6 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
      Code = bitc::FUNC_CODE_INST_RESUME;
      PushValueAndType(I.getOperand(0), InstID, Vals, VE);
      break;
-  case Instruction::Unwind:
-    Code = bitc::FUNC_CODE_INST_UNWIND;
-    break;
    case Instruction::Unreachable:
      Code = bitc::FUNC_CODE_INST_UNREACHABLE;
      AbbrevToUse = FUNCTION_INST_UNREACHABLE_ABBREV;
@@ -1162,12 +1281,19 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
    case Instruction::PHI: {
      const PHINode &PN = cast<PHINode>(I);
      Code = bitc::FUNC_CODE_INST_PHI;
-    Vals.push_back(VE.getTypeID(PN.getType()));
+    // With the newer instruction encoding, forward references could give
+    // negative valued IDs.  This is most common for PHIs, so we use
+    // signed VBRs.
+    SmallVector<uint64_t, 128> Vals64;
+    Vals64.push_back(VE.getTypeID(PN.getType()));
      for (unsigned i = 0, e = PN.getNumIncomingValues(); i != e; ++i) {
-      Vals.push_back(VE.getValueID(PN.getIncomingValue(i)));
-      Vals.push_back(VE.getValueID(PN.getIncomingBlock(i)));
+      pushValueSigned(PN.getIncomingValue(i), InstID, Vals64, VE);
+      Vals64.push_back(VE.getValueID(PN.getIncomingBlock(i)));
      }
-    break;
+    // Emit a Vals64 vector and exit.
+    Stream.EmitRecord(Code, Vals64, AbbrevToUse);
+    Vals64.clear();
+    return;
    }
  
    case Instruction::LandingPad: {
@@ -1217,7 +1343,7 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
      else
        Code = bitc::FUNC_CODE_INST_STORE;
      PushValueAndType(I.getOperand(1), InstID, Vals, VE);  // ptrty + ptr
-    Vals.push_back(VE.getValueID(I.getOperand(0)));       // val.
+    pushValue(I.getOperand(0), InstID, Vals, VE);         // val.
      Vals.push_back(Log2_32(cast<StoreInst>(I).getAlignment())+1);
      Vals.push_back(cast<StoreInst>(I).isVolatile());
      if (cast<StoreInst>(I).isAtomic()) {
@@ -1228,8 +1354,8 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
    case Instruction::AtomicCmpXchg:
      Code = bitc::FUNC_CODE_INST_CMPXCHG;
      PushValueAndType(I.getOperand(0), InstID, Vals, VE);  // ptrty + ptr
-    Vals.push_back(VE.getValueID(I.getOperand(1)));       // cmp.
-    Vals.push_back(VE.getValueID(I.getOperand(2)));       // newval.
+    pushValue(I.getOperand(1), InstID, Vals, VE);         // cmp.
+    pushValue(I.getOperand(2), InstID, Vals, VE);         // newval.
      Vals.push_back(cast<AtomicCmpXchgInst>(I).isVolatile());
      Vals.push_back(GetEncodedOrdering(
                       cast<AtomicCmpXchgInst>(I).getOrdering()));
@@ -1239,7 +1365,7 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
    case Instruction::AtomicRMW:
      Code = bitc::FUNC_CODE_INST_ATOMICRMW;
      PushValueAndType(I.getOperand(0), InstID, Vals, VE);  // ptrty + ptr
-    Vals.push_back(VE.getValueID(I.getOperand(1)));       // val.
+    pushValue(I.getOperand(1), InstID, Vals, VE);         // val.
      Vals.push_back(GetEncodedRMWOperation(
                       cast<AtomicRMWInst>(I).getOperation()));
      Vals.push_back(cast<AtomicRMWInst>(I).isVolatile());
@@ -1264,8 +1390,13 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
      PushValueAndType(CI.getCalledValue(), InstID, Vals, VE);  // Callee
  
      // Emit value #'s for the fixed parameters.
-    for (unsigned i = 0, e = FTy->getNumParams(); i != e; ++i)
-      Vals.push_back(VE.getValueID(CI.getArgOperand(i)));  // fixed param.
+    for (unsigned i = 0, e = FTy->getNumParams(); i != e; ++i) {
+      // Check for labels (can happen with asm labels).
+      if (FTy->getParamType(i)->isLabelTy())
+        Vals.push_back(VE.getValueID(CI.getArgOperand(i)));
+      else
+        pushValue(CI.getArgOperand(i), InstID, Vals, VE);  // fixed param.
+    }
  
      // Emit type/value pairs for varargs params.
      if (FTy->isVarArg()) {
@@ -1278,7 +1409,7 @@ static void WriteInstruction(const Instruction &I, unsigned InstID,
    case Instruction::VAArg:
      Code = bitc::FUNC_CODE_INST_VAARG;
      Vals.push_back(VE.getTypeID(I.getOperand(0)->getType()));   // valistty
-    Vals.push_back(VE.getValueID(I.getOperand(0))); // valist.
+    pushValue(I.getOperand(0), InstID, Vals, VE); // valist.
      Vals.push_back(VE.getTypeID(I.getType())); // restype.
      break;
    }
@@ -1420,8 +1551,8 @@ static void WriteFunction(const Function &F, ValueEnumerator &VE,
  // Emit blockinfo, which defines the standard abbreviations etc.
  static void WriteBlockInfo(const ValueEnumerator &VE, BitstreamWriter &Stream) {
    // We only want to emit block info records for blocks that have multiple
-  // instances: CONSTANTS_BLOCK, FUNCTION_BLOCK and VALUE_SYMTAB_BLOCK.  Other
-  // blocks can defined their abbrevs inline.
+  // instances: CONSTANTS_BLOCK, FUNCTION_BLOCK and VALUE_SYMTAB_BLOCK.
+  // Other blocks can defined their abbrevs inline.
    Stream.EnterBlockInfoBlock(2);
  
    { // 8-bit fixed-width VST_ENTRY/VST_BBENTRY strings.
@@ -1578,17 +1709,99 @@ static void WriteBlockInfo(const ValueEnumerator &VE, BitstreamWriter &Stream) {
    Stream.ExitBlock();
  }
  
+// Sort the Users based on the order in which the reader parses the bitcode 
+// file.
+static bool bitcodereader_order(const User *lhs, const User *rhs) {
+  // TODO: Implement.
+  return true;
+}
+
+static void WriteUseList(const Value *V, const ValueEnumerator &VE,
+                         BitstreamWriter &Stream) {
+
+  // One or zero uses can't get out of order.
+  if (V->use_empty() || V->hasNUses(1))
+    return;
+
+  // Make a copy of the in-memory use-list for sorting.
+  unsigned UseListSize = std::distance(V->use_begin(), V->use_end());
+  SmallVector<const User*, 8> UseList;
+  UseList.reserve(UseListSize);
+  for (Value::const_use_iterator I = V->use_begin(), E = V->use_end();
+       I != E; ++I) {
+    const User *U = *I;
+    UseList.push_back(U);
+  }
+
+  // Sort the copy based on the order read by the BitcodeReader.
+  std::sort(UseList.begin(), UseList.end(), bitcodereader_order);
+
+  // TODO: Generate a diff between the BitcodeWriter in-memory use-list and the
+  // sorted list (i.e., the expected BitcodeReader in-memory use-list).
+
+  // TODO: Emit the USELIST_CODE_ENTRYs.
+}
+
+static void WriteFunctionUseList(const Function *F, ValueEnumerator &VE,
+                                 BitstreamWriter &Stream) {
+  VE.incorporateFunction(*F);
+
+  for (Function::const_arg_iterator AI = F->arg_begin(), AE = F->arg_end();
+       AI != AE; ++AI)
+    WriteUseList(AI, VE, Stream);
+  for (Function::const_iterator BB = F->begin(), FE = F->end(); BB != FE;
+       ++BB) {
+    WriteUseList(BB, VE, Stream);
+    for (BasicBlock::const_iterator II = BB->begin(), IE = BB->end(); II != IE;
+         ++II) {
+      WriteUseList(II, VE, Stream);
+      for (User::const_op_iterator OI = II->op_begin(), E = II->op_end();
+           OI != E; ++OI) {
+        if ((isa<Constant>(*OI) && !isa<GlobalValue>(*OI)) ||
+            isa<InlineAsm>(*OI))
+          WriteUseList(*OI, VE, Stream);
+      }
+    }
+  }
+  VE.purgeFunction();
+}
+
  // Emit use-lists.
  static void WriteModuleUseLists(const Module *M, ValueEnumerator &VE,
                                  BitstreamWriter &Stream) {
    Stream.EnterSubblock(bitc::USELIST_BLOCK_ID, 3);
  
-  // Emit a bogus record for testing purposes.
-  SmallVector<uint64_t, 64> Record;
-  Record.push_back(0);
-  Stream.EmitRecord(bitc::USELIST_CODE_ENTRY, Record);
+  // XXX: this modifies the module, but in a way that should never change the
+  // behavior of any pass or codegen in LLVM. The problem is that GVs may
+  // contain entries in the use_list that do not exist in the Module and are
+  // not stored in the .bc file.
+  for (Module::const_global_iterator I = M->global_begin(), E = M->global_end();
+       I != E; ++I)
+    I->removeDeadConstantUsers();
+  
+  // Write the global variables.
+  for (Module::const_global_iterator GI = M->global_begin(), 
+         GE = M->global_end(); GI != GE; ++GI) {
+    WriteUseList(GI, VE, Stream);
+
+    // Write the global variable initializers.
+    if (GI->hasInitializer())
+      WriteUseList(GI->getInitializer(), VE, Stream);
+  }
  
-  // TODO: Tons.
+  // Write the functions.
+  for (Module::const_iterator FI = M->begin(), FE = M->end(); FI != FE; ++FI) {
+    WriteUseList(FI, VE, Stream);
+    if (!FI->isDeclaration())
+      WriteFunctionUseList(FI, VE, Stream);
+  }
+
+  // Write the aliases.
+  for (Module::const_alias_iterator AI = M->alias_begin(), AE = M->alias_end();
+       AI != AE; ++AI) {
+    WriteUseList(AI, VE, Stream);
+    WriteUseList(AI->getAliasee(), VE, Stream);
+  }
  
    Stream.ExitBlock();
  }
@@ -1597,12 +1810,10 @@ static void WriteModuleUseLists(const Module *M, ValueEnumerator &VE,
  static void WriteModule(const Module *M, BitstreamWriter &Stream) {
    Stream.EnterSubblock(bitc::MODULE_BLOCK_ID, 3);
  
-  // Emit the version number if it is non-zero.
-  if (CurVersion) {
-    SmallVector<unsigned, 1> Vals;
-    Vals.push_back(CurVersion);
-    Stream.EmitRecord(bitc::MODULE_CODE_VERSION, Vals);
-  }
+  SmallVector<unsigned, 1> Vals;
+  unsigned CurVersion = 1;
+  Vals.push_back(CurVersion);
+  Stream.EmitRecord(bitc::MODULE_CODE_VERSION, Vals);
  
    // Analyze the module, enumerating globals, functions, etc.
    ValueEnumerator VE(M);
@@ -1626,11 +1837,6 @@ static void WriteModule(const Module *M, BitstreamWriter &Stream) {
    // Emit metadata.
    WriteModuleMetadata(M, VE, Stream);
  
-  // Emit function bodies.
-  for (Module::const_iterator F = M->begin(), E = M->end(); F != E; ++F)
-    if (!F->isDeclaration())
-      WriteFunction(*F, VE, Stream);
-
    // Emit metadata.
    WriteModuleMetadataStore(M, Stream);
  
@@ -1641,6 +1847,11 @@ static void WriteModule(const Module *M, BitstreamWriter &Stream) {
    if (EnablePreserveUseListOrdering)
      WriteModuleUseLists(M, VE, Stream);
  
+  // Emit function bodies.
+  for (Module::const_iterator F = M->begin(), E = M->end(); F != E; ++F)
+    if (!F->isDeclaration())
+      WriteFunction(*F, VE, Stream);
+
    Stream.ExitBlock();
  }
  
@@ -1662,7 +1873,17 @@ enum {
    DarwinBCHeaderSize = 5*4
  };
  
-static void EmitDarwinBCHeader(BitstreamWriter &Stream, const Triple &TT) {
+static void WriteInt32ToBuffer(uint32_t Value, SmallVectorImpl<char> &Buffer,
+                               uint32_t &Position) {
+  Buffer[Position + 0] = (unsigned char) (Value >>  0);
+  Buffer[Position + 1] = (unsigned char) (Value >>  8);
+  Buffer[Position + 2] = (unsigned char) (Value >> 16);
+  Buffer[Position + 3] = (unsigned char) (Value >> 24);
+  Position += 4;
+}
+
+static void EmitDarwinBCHeaderAndTrailer(SmallVectorImpl<char> &Buffer,
+                                         const Triple &TT) {
    unsigned CPUType = ~0U;
  
    // Match x86_64-*, i[3-9]86-*, powerpc-*, powerpc64-*, arm-*, thumb-*,
@@ -1689,63 +1910,55 @@ static void EmitDarwinBCHeader(BitstreamWriter &Stream, const Triple &TT) {
      CPUType = DARWIN_CPU_TYPE_ARM;
  
    // Traditional Bitcode starts after header.
+  assert(Buffer.size() >= DarwinBCHeaderSize &&
+         "Expected header size to be reserved");
    unsigned BCOffset = DarwinBCHeaderSize;
+  unsigned BCSize = Buffer.size()-DarwinBCHeaderSize;
  
-  Stream.Emit(0x0B17C0DE, 32);
-  Stream.Emit(0         , 32);  // Version.
-  Stream.Emit(BCOffset  , 32);
-  Stream.Emit(0         , 32);  // Filled in later.
-  Stream.Emit(CPUType   , 32);
-}
-
-/// EmitDarwinBCTrailer - Emit the darwin epilog after the bitcode file and
-/// finalize the header.
-static void EmitDarwinBCTrailer(BitstreamWriter &Stream, unsigned BufferSize) {
-  // Update the size field in the header.
-  Stream.BackpatchWord(DarwinBCSizeFieldOffset, BufferSize-DarwinBCHeaderSize);
+  // Write the magic and version.
+  unsigned Position = 0;
+  WriteInt32ToBuffer(0x0B17C0DE , Buffer, Position);
+  WriteInt32ToBuffer(0          , Buffer, Position); // Version.
+  WriteInt32ToBuffer(BCOffset   , Buffer, Position);
+  WriteInt32ToBuffer(BCSize     , Buffer, Position);
+  WriteInt32ToBuffer(CPUType    , Buffer, Position);
  
    // If the file is not a multiple of 16 bytes, insert dummy padding.
-  while (BufferSize & 15) {
-    Stream.Emit(0, 8);
-    ++BufferSize;
-  }
+  while (Buffer.size() & 15)
+    Buffer.push_back(0);
  }
  
-
  /// WriteBitcodeToFile - Write the specified module to the specified output
  /// stream.
  void llvm::WriteBitcodeToFile(const Module *M, raw_ostream &Out) {
-  std::vector<unsigned char> Buffer;
-  BitstreamWriter Stream(Buffer);
-
+  SmallVector<char, 1024> Buffer;
    Buffer.reserve(256*1024);
  
-  WriteBitcodeToStream( M, Stream );
-
-  // Write the generated bitstream to "Out".
-  Out.write((char*)&Buffer.front(), Buffer.size());
-}
-
-/// WriteBitcodeToStream - Write the specified module to the specified output
-/// stream.
-void llvm::WriteBitcodeToStream(const Module *M, BitstreamWriter &Stream) {
-  // If this is darwin or another generic macho target, emit a file header and
-  // trailer if needed.
+  // If this is darwin or another generic macho target, reserve space for the
+  // header.
    Triple TT(M->getTargetTriple());
    if (TT.isOSDarwin())
-    EmitDarwinBCHeader(Stream, TT);
-
-  // Emit the file header.
-  Stream.Emit((unsigned)'B', 8);
-  Stream.Emit((unsigned)'C', 8);
-  Stream.Emit(0x0, 4);
-  Stream.Emit(0xC, 4);
-  Stream.Emit(0xE, 4);
-  Stream.Emit(0xD, 4);
-
-  // Emit the module.
-  WriteModule(M, Stream);
+    Buffer.insert(Buffer.begin(), DarwinBCHeaderSize, 0);
+
+  // Emit the module into the buffer.
+  {
+    BitstreamWriter Stream(Buffer);
+
+    // Emit the file header.
+    Stream.Emit((unsigned)'B', 8);
+    Stream.Emit((unsigned)'C', 8);
+    Stream.Emit(0x0, 4);
+    Stream.Emit(0xC, 4);
+    Stream.Emit(0xE, 4);
+    Stream.Emit(0xD, 4);
+
+    // Emit the module.
+    WriteModule(M, Stream);
+  }
  
    if (TT.isOSDarwin())
-    EmitDarwinBCTrailer(Stream, Stream.getBuffer().size());
+    EmitDarwinBCHeaderAndTrailer(Buffer, TT);
+
+  // Write the generated bitstream to "Out".
+  Out.write((char*)&Buffer.front(), Buffer.size());
  }