Nuke no longer accurate comment.

[oota-llvm.git] / lib / Target / ARM / AsmParser / ARMAsmParser.cpp
diff --git a/lib/Target/ARM/AsmParser/ARMAsmParser.cpp b/lib/Target/ARM/AsmParser/ARMAsmParser.cpp

index 3a60ff94d9bd90316eaf3e426068e189b6dc9273..af7fe33258f4b0ec8f4441398598e8420d95be27 100644 (file)
--- a/lib/Target/ARM/AsmParser/ARMAsmParser.cpp
+++ b/lib/Target/ARM/AsmParser/ARMAsmParser.cpp
@@ -30,7 +30,6 @@
  #include "llvm/ADT/OwningPtr.h"
  #include "llvm/ADT/STLExtras.h"
  #include "llvm/ADT/SmallVector.h"
-#include "llvm/ADT/StringExtras.h"
  #include "llvm/ADT/StringSwitch.h"
  #include "llvm/ADT/Twine.h"
  
@@ -198,10 +197,18 @@ class ARMAsmParser : public MCTargetAsmParser {
                                    const SmallVectorImpl<MCParsedAsmOperand*> &);
    bool cvtThumbMultiply(MCInst &Inst, unsigned Opcode,
                          const SmallVectorImpl<MCParsedAsmOperand*> &);
+  bool cvtVLDwbFixed(MCInst &Inst, unsigned Opcode,
+                     const SmallVectorImpl<MCParsedAsmOperand*> &);
+  bool cvtVLDwbRegister(MCInst &Inst, unsigned Opcode,
+                        const SmallVectorImpl<MCParsedAsmOperand*> &);
+  bool cvtVSTwbFixed(MCInst &Inst, unsigned Opcode,
+                     const SmallVectorImpl<MCParsedAsmOperand*> &);
+  bool cvtVSTwbRegister(MCInst &Inst, unsigned Opcode,
+                        const SmallVectorImpl<MCParsedAsmOperand*> &);
  
    bool validateInstruction(MCInst &Inst,
                             const SmallVectorImpl<MCParsedAsmOperand*> &Ops);
-  void processInstruction(MCInst &Inst,
+  bool processInstruction(MCInst &Inst,
                            const SmallVectorImpl<MCParsedAsmOperand*> &Ops);
    bool shouldOmitCCOutOperand(StringRef Mnemonic,
                                SmallVectorImpl<MCParsedAsmOperand*> &Operands);
@@ -595,6 +602,14 @@ public:
      int64_t Value = CE->getValue();
      return Value > 0 && Value < 33;
    }
+  bool isImm0_32() const {
+    if (Kind != k_Immediate)
+      return false;
+    const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
+    if (!CE) return false;
+    int64_t Value = CE->getValue();
+    return Value >= 0 && Value < 33;
+  }
    bool isImm0_65535() const {
      if (Kind != k_Immediate)
        return false;
@@ -653,6 +668,14 @@ public:
      int64_t Value = CE->getValue();
      return ARM_AM::getSOImmVal(Value) != -1;
    }
+  bool isARMSOImmNot() const {
+    if (Kind != k_Immediate)
+      return false;
+    const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
+    if (!CE) return false;
+    int64_t Value = CE->getValue();
+    return ARM_AM::getSOImmVal(~Value) != -1;
+  }
    bool isT2SOImm() const {
      if (Kind != k_Immediate)
        return false;
@@ -661,6 +684,14 @@ public:
      int64_t Value = CE->getValue();
      return ARM_AM::getT2SOImmVal(Value) != -1;
    }
+  bool isT2SOImmNot() const {
+    if (Kind != k_Immediate)
+      return false;
+    const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
+    if (!CE) return false;
+    int64_t Value = CE->getValue();
+    return ARM_AM::getT2SOImmVal(~Value) != -1;
+  }
    bool isSetEndImm() const {
      if (Kind != k_Immediate)
        return false;
@@ -737,6 +768,11 @@ public:
      return (Val > -256 && Val < 256) || Val == INT32_MIN;
    }
    bool isAddrMode5() const {
+    // If we have an immediate that's not a constant, treat it as a label
+    // reference needing a fixup. If it is a constant, it's something else
+    // and we reject it.
+    if (Kind == k_Immediate && !isa<MCConstantExpr>(getImm()))
+      return true;
      if (!isMemory() || Memory.Alignment != 0) return false;
      // Check for register offset.
      if (Memory.OffsetRegNum) return false;
@@ -744,7 +780,7 @@ public:
      if (!Memory.OffsetImm) return true;
      int64_t Val = Memory.OffsetImm->getValue();
      return (Val >= -1020 && Val <= 1020 && ((Val & 3) == 0)) ||
-           Val == INT32_MIN;
+      Val == INT32_MIN;
    }
    bool isMemTBB() const {
      if (!isMemory() || !Memory.OffsetRegNum || Memory.isNegative ||
@@ -861,12 +897,6 @@ public:
      return Val > -256 && Val < 0;
    }
    bool isMemUImm12Offset() const {
-    // If we have an immediate that's not a constant, treat it as a label
-    // reference needing a fixup. If it is a constant, it's something else
-    // and we reject it.
-    if (Kind == k_Immediate && !isa<MCConstantExpr>(getImm()))
-      return true;
-
      if (!isMemory() || Memory.OffsetRegNum != 0 || Memory.Alignment != 0)
        return false;
      // Immediate offset in range [0, 4095].
@@ -1195,6 +1225,11 @@ public:
      Inst.addOperand(MCOperand::CreateImm(CE->getValue() - 1));
    }
  
+  void addImm0_32Operands(MCInst &Inst, unsigned N) const {
+    assert(N == 1 && "Invalid number of operands!");
+    addExpr(Inst, getImm());
+  }
+
    void addImm0_65535Operands(MCInst &Inst, unsigned N) const {
      assert(N == 1 && "Invalid number of operands!");
      addExpr(Inst, getImm());
@@ -1243,6 +1278,22 @@ public:
      addExpr(Inst, getImm());
    }
  
+  void addT2SOImmNotOperands(MCInst &Inst, unsigned N) const {
+    assert(N == 1 && "Invalid number of operands!");
+    // The operand is actually a t2_so_imm, but we have its bitwise
+    // negation in the assembly source, so twiddle it here.
+    const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
+    Inst.addOperand(MCOperand::CreateImm(~CE->getValue()));
+  }
+
+  void addARMSOImmNotOperands(MCInst &Inst, unsigned N) const {
+    assert(N == 1 && "Invalid number of operands!");
+    // The operand is actually a so_imm, but we have its bitwise
+    // negation in the assembly source, so twiddle it here.
+    const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
+    Inst.addOperand(MCOperand::CreateImm(~CE->getValue()));
+  }
+
    void addSetEndImmOperands(MCInst &Inst, unsigned N) const {
      assert(N == 1 && "Invalid number of operands!");
      addExpr(Inst, getImm());
@@ -1341,6 +1392,15 @@ public:
  
    void addAddrMode5Operands(MCInst &Inst, unsigned N) const {
      assert(N == 2 && "Invalid number of operands!");
+    // If we have an immediate that's not a constant, treat it as a label
+    // reference needing a fixup. If it is a constant, it's something else
+    // and we reject it.
+    if (isImm()) {
+      Inst.addOperand(MCOperand::CreateExpr(getImm()));
+      Inst.addOperand(MCOperand::CreateImm(0));
+      return;
+    }
+
      // The lower two bits are always zero and as such are not encoded.
      int32_t Val = Memory.OffsetImm ? Memory.OffsetImm->getValue() / 4 : 0;
      ARM_AM::AddrOpc AddSub = Val < 0 ? ARM_AM::sub : ARM_AM::add;
@@ -1886,9 +1946,10 @@ void ARMOperand::print(raw_ostream &OS) const {
      OS << "<ccout " << getReg() << ">";
      break;
    case k_ITCondMask: {
-    static char MaskStr[][6] = { "()", "(t)", "(e)", "(tt)", "(et)", "(te)",
-      "(ee)", "(ttt)", "(ett)", "(tet)", "(eet)", "(tte)", "(ete)",
-      "(tee)", "(eee)" };
+    static const char *MaskStr[] = {
+      "()", "(t)", "(e)", "(tt)", "(et)", "(te)", "(ee)", "(ttt)", "(ett)",
+      "(tet)", "(eet)", "(tte)", "(ete)", "(tee)", "(eee)"
+    };
      assert((ITMask.Mask & 0xf) == ITMask.Mask);
      OS << "<it-mask " << MaskStr[ITMask.Mask] << ">";
      break;
@@ -2014,8 +2075,7 @@ int ARMAsmParser::tryParseRegister() {
  
    // FIXME: Validate register for the current architecture; we have to do
    // validation later, so maybe there is no need for this here.
-  std::string upperCase = Tok.getString().str();
-  std::string lowerCase = LowercaseString(upperCase);
+  std::string lowerCase = Tok.getString().lower();
    unsigned RegNum = MatchRegisterName(lowerCase);
    if (!RegNum) {
      RegNum = StringSwitch<unsigned>(lowerCase)
@@ -2043,8 +2103,7 @@ int ARMAsmParser::tryParseShiftRegister(
    const AsmToken &Tok = Parser.getTok();
    assert(Tok.is(AsmToken::Identifier) && "Token is not an Identifier");
  
-  std::string upperCase = Tok.getString().str();
-  std::string lowerCase = LowercaseString(upperCase);
+  std::string lowerCase = Tok.getString().lower();
    ARM_AM::ShiftOpc ShiftTy = StringSwitch<ARM_AM::ShiftOpc>(lowerCase)
        .Case("lsl", ARM_AM::lsl)
        .Case("lsr", ARM_AM::lsr)
@@ -2351,6 +2410,29 @@ static unsigned getNextRegister(unsigned Reg) {
    }
  }
  
+// Return the low-subreg of a given Q register.
+static unsigned getDRegFromQReg(unsigned QReg) {
+  switch (QReg) {
+  default: llvm_unreachable("expected a Q register!");
+  case ARM::Q0:  return ARM::D0;
+  case ARM::Q1:  return ARM::D2;
+  case ARM::Q2:  return ARM::D4;
+  case ARM::Q3:  return ARM::D6;
+  case ARM::Q4:  return ARM::D8;
+  case ARM::Q5:  return ARM::D10;
+  case ARM::Q6:  return ARM::D12;
+  case ARM::Q7:  return ARM::D14;
+  case ARM::Q8:  return ARM::D16;
+  case ARM::Q9:  return ARM::D19;
+  case ARM::Q10: return ARM::D20;
+  case ARM::Q11: return ARM::D22;
+  case ARM::Q12: return ARM::D24;
+  case ARM::Q13: return ARM::D26;
+  case ARM::Q14: return ARM::D28;
+  case ARM::Q15: return ARM::D30;
+  }
+}
+
  /// Parse a register list.
  bool ARMAsmParser::
  parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
@@ -2366,7 +2448,17 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    if (Reg == -1)
      return Error(RegLoc, "register expected");
  
-  MCRegisterClass *RC;
+  // The reglist instructions have at most 16 registers, so reserve
+  // space for that many.
+  SmallVector<std::pair<unsigned, SMLoc>, 16> Registers;
+
+  // Allow Q regs and just interpret them as the two D sub-registers.
+  if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(Reg)) {
+    Reg = getDRegFromQReg(Reg);
+    Registers.push_back(std::pair<unsigned, SMLoc>(Reg, RegLoc));
+    ++Reg;
+  }
+  const MCRegisterClass *RC;
    if (ARMMCRegisterClasses[ARM::GPRRegClassID].contains(Reg))
      RC = &ARMMCRegisterClasses[ARM::GPRRegClassID];
    else if (ARMMCRegisterClasses[ARM::DPRRegClassID].contains(Reg))
@@ -2376,10 +2468,7 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    else
      return Error(RegLoc, "invalid register in register list");
  
-  // The reglist instructions have at most 16 registers, so reserve
-  // space for that many.
-  SmallVector<std::pair<unsigned, SMLoc>, 16> Registers;
-  // Store the first register.
+  // Store the register.
    Registers.push_back(std::pair<unsigned, SMLoc>(Reg, RegLoc));
  
    // This starts immediately after the first register token in the list,
@@ -2393,6 +2482,9 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
        int EndReg = tryParseRegister();
        if (EndReg == -1)
          return Error(EndLoc, "register expected");
+      // Allow Q regs and just interpret them as the two D sub-registers.
+      if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(EndReg))
+        EndReg = getDRegFromQReg(EndReg) + 1;
        // If the register is the same as the start reg, there's nothing
        // more to do.
        if (Reg == EndReg)
@@ -2417,6 +2509,12 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
      Reg = tryParseRegister();
      if (Reg == -1)
        return Error(RegLoc, "register expected");
+    // Allow Q regs and just interpret them as the two D sub-registers.
+    bool isQReg = false;
+    if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(Reg)) {
+      Reg = getDRegFromQReg(Reg);
+      isQReg = true;
+    }
      // The register must be in the same register class as the first.
      if (!RC->contains(Reg))
        return Error(RegLoc, "invalid register in register list");
@@ -2430,6 +2528,8 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
          Reg != OldReg + 1)
        return Error(RegLoc, "non-contiguous register range");
      Registers.push_back(std::pair<unsigned, SMLoc>(Reg, RegLoc));
+    if (isQReg)
+      Registers.push_back(std::pair<unsigned, SMLoc>(++Reg, RegLoc));
    }
  
    SMLoc E = Parser.getTok().getLoc();
@@ -2456,9 +2556,16 @@ parseVectorList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
      Error(RegLoc, "register expected");
      return MatchOperand_ParseFail;
    }
-
-  unsigned FirstReg = Reg;
    unsigned Count = 1;
+  unsigned FirstReg = Reg;
+  // The list is of D registers, but we also allow Q regs and just interpret
+  // them as the two D sub-registers.
+  if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(Reg)) {
+    FirstReg = Reg = getDRegFromQReg(Reg);
+    ++Reg;
+    ++Count;
+  }
+
    while (Parser.getTok().is(AsmToken::Comma)) {
      Parser.Lex(); // Eat the comma.
      RegLoc = Parser.getTok().getLoc();
@@ -2468,14 +2575,27 @@ parseVectorList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
        Error(RegLoc, "register expected");
        return MatchOperand_ParseFail;
      }
-    // vector register lists must also be contiguous.
+    // vector register lists must be contiguous.
      // It's OK to use the enumeration values directly here rather, as the
      // VFP register classes have the enum sorted properly.
+    //
+    // The list is of D registers, but we also allow Q regs and just interpret
+    // them as the two D sub-registers.
+    if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(Reg)) {
+      Reg = getDRegFromQReg(Reg);
+      if (Reg != OldReg + 1) {
+        Error(RegLoc, "non-contiguous register range");
+        return MatchOperand_ParseFail;
+      }
+      ++Reg;
+      Count += 2;
+      continue;
+    }
+    // Normal D register. Just check that it's contiguous and keep going.
      if (Reg != OldReg + 1) {
        Error(RegLoc, "non-contiguous register range");
        return MatchOperand_ParseFail;
      }
-
      ++Count;
    }
  
@@ -2596,7 +2716,7 @@ parseMSRMaskOperand(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    // Split spec_reg from flag, example: CPSR_sxf => "CPSR" and "sxf"
    size_t Start = 0, Next = Mask.find('_');
    StringRef Flags = "";
-  std::string SpecReg = LowercaseString(Mask.slice(Start, Next));
+  std::string SpecReg = Mask.slice(Start, Next).lower();
    if (Next != StringRef::npos)
      Flags = Mask.slice(Next+1, Mask.size());
  
@@ -2664,8 +2784,8 @@ parsePKHImm(SmallVectorImpl<MCParsedAsmOperand*> &Operands, StringRef Op,
      return MatchOperand_ParseFail;
    }
    StringRef ShiftName = Tok.getString();
-  std::string LowerOp = LowercaseString(Op);
-  std::string UpperOp = UppercaseString(Op);
+  std::string LowerOp = Op.lower();
+  std::string UpperOp = Op.upper();
    if (ShiftName != LowerOp && ShiftName != UpperOp) {
      Error(Parser.getTok().getLoc(), Op + " operand expected.");
      return MatchOperand_ParseFail;
@@ -3313,18 +3433,80 @@ cvtThumbMultiply(MCInst &Inst, unsigned Opcode,
    }
    ((ARMOperand*)Operands[3])->addRegOperands(Inst, 1);
    ((ARMOperand*)Operands[1])->addCCOutOperands(Inst, 1);
-  ((ARMOperand*)Operands[4])->addRegOperands(Inst, 1);
-  // If we have a three-operand form, use that, else the second source operand
-  // is just the destination operand again.
-  if (Operands.size() == 6)
-    ((ARMOperand*)Operands[5])->addRegOperands(Inst, 1);
-  else
-    Inst.addOperand(Inst.getOperand(0));
+  // If we have a three-operand form, make sure to set Rn to be the operand
+  // that isn't the same as Rd.
+  unsigned RegOp = 4;
+  if (Operands.size() == 6 &&
+      ((ARMOperand*)Operands[4])->getReg() ==
+        ((ARMOperand*)Operands[3])->getReg())
+    RegOp = 5;
+  ((ARMOperand*)Operands[RegOp])->addRegOperands(Inst, 1);
+  Inst.addOperand(Inst.getOperand(0));
    ((ARMOperand*)Operands[2])->addCondCodeOperands(Inst, 2);
  
    return true;
  }
  
+bool ARMAsmParser::
+cvtVLDwbFixed(MCInst &Inst, unsigned Opcode,
+              const SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
+  // Vd
+  ((ARMOperand*)Operands[3])->addVecListTwoDOperands(Inst, 1);
+  // Create a writeback register dummy placeholder.
+  Inst.addOperand(MCOperand::CreateImm(0));
+  // Vn
+  ((ARMOperand*)Operands[4])->addAlignedMemoryOperands(Inst, 2);
+  // pred
+  ((ARMOperand*)Operands[1])->addCondCodeOperands(Inst, 2);
+  return true;
+}
+
+bool ARMAsmParser::
+cvtVLDwbRegister(MCInst &Inst, unsigned Opcode,
+                 const SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
+  // Vd
+  ((ARMOperand*)Operands[3])->addVecListTwoDOperands(Inst, 1);
+  // Create a writeback register dummy placeholder.
+  Inst.addOperand(MCOperand::CreateImm(0));
+  // Vn
+  ((ARMOperand*)Operands[4])->addAlignedMemoryOperands(Inst, 2);
+  // Vm
+  ((ARMOperand*)Operands[5])->addRegOperands(Inst, 1);
+  // pred
+  ((ARMOperand*)Operands[1])->addCondCodeOperands(Inst, 2);
+  return true;
+}
+
+bool ARMAsmParser::
+cvtVSTwbFixed(MCInst &Inst, unsigned Opcode,
+              const SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
+  // Create a writeback register dummy placeholder.
+  Inst.addOperand(MCOperand::CreateImm(0));
+  // Vn
+  ((ARMOperand*)Operands[4])->addAlignedMemoryOperands(Inst, 2);
+  // Vt
+  ((ARMOperand*)Operands[3])->addVecListTwoDOperands(Inst, 1);
+  // pred
+  ((ARMOperand*)Operands[1])->addCondCodeOperands(Inst, 2);
+  return true;
+}
+
+bool ARMAsmParser::
+cvtVSTwbRegister(MCInst &Inst, unsigned Opcode,
+                 const SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
+  // Create a writeback register dummy placeholder.
+  Inst.addOperand(MCOperand::CreateImm(0));
+  // Vn
+  ((ARMOperand*)Operands[4])->addAlignedMemoryOperands(Inst, 2);
+  // Vm
+  ((ARMOperand*)Operands[5])->addRegOperands(Inst, 1);
+  // Vt
+  ((ARMOperand*)Operands[3])->addVecListTwoDOperands(Inst, 1);
+  // pred
+  ((ARMOperand*)Operands[1])->addCondCodeOperands(Inst, 2);
+  return true;
+}
+
  /// Parse an ARM memory expression, return false if successful else return true
  /// or an error.  The first token must be a '[' when called.
  bool ARMAsmParser::
@@ -3656,7 +3838,9 @@ bool ARMAsmParser::parseOperand(SmallVectorImpl<MCParsedAsmOperand*> &Operands,
      // Fall though for the Identifier case that is not a register or a
      // special name.
    }
+  case AsmToken::LParen:  // parenthesized expressions like (_strcmp-4)
    case AsmToken::Integer: // things like 1f and 2b as a branch targets
+  case AsmToken::String:  // quoted label names.
    case AsmToken::Dot: {   // . as a branch target
      // This was not a register so parse other operands that start with an
      // identifier (like labels) as expressions and create them as immediates.
@@ -3682,13 +3866,11 @@ bool ARMAsmParser::parseOperand(SmallVectorImpl<MCParsedAsmOperand*> &Operands,
      if (getParser().ParseExpression(ImmVal))
        return true;
      const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(ImmVal);
-    if (!CE) {
-      Error(S, "constant expression expected");
-      return MatchOperand_ParseFail;
+    if (CE) {
+      int32_t Val = CE->getValue();
+      if (isNegative && Val == 0)
+        ImmVal = MCConstantExpr::Create(INT32_MIN, getContext());
      }
-    int32_t Val = CE->getValue();
-    if (isNegative && Val == 0)
-      ImmVal = MCConstantExpr::Create(INT32_MIN, getContext());
      E = SMLoc::getFromPointer(Parser.getTok().getLoc().getPointer() - 1);
      Operands.push_back(ARMOperand::CreateImm(ImmVal, S, E));
      return false;
@@ -4101,9 +4283,6 @@ bool ARMAsmParser::ParseInstruction(StringRef Name, SMLoc NameLoc,
      Next = Name.find('.', Start + 1);
      StringRef ExtraToken = Name.slice(Start, Next);
  
-    // For now, we're only parsing Thumb1 (for the most part), so
-    // just ignore ".n" qualifiers. We'll use them to restrict
-    // matching when we do Thumb2.
      if (ExtraToken != ".n") {
        SMLoc Loc = SMLoc::getFromPointer(NameLoc.getPointer() + Start);
        Operands.push_back(ARMOperand::CreateToken(ExtraToken, Loc));
@@ -4237,9 +4416,9 @@ static bool listContainsReg(MCInst &Inst, unsigned OpNo, unsigned Reg) {
  // the ARMInsts array) instead. Getting that here requires awkward
  // API changes, though. Better way?
  namespace llvm {
-extern MCInstrDesc ARMInsts[];
+extern const MCInstrDesc ARMInsts[];
  }
-static MCInstrDesc &getInstDesc(unsigned Opcode) {
+static const MCInstrDesc &getInstDesc(unsigned Opcode) {
    return ARMInsts[Opcode];
  }
  
@@ -4247,7 +4426,7 @@ static MCInstrDesc &getInstDesc(unsigned Opcode) {
  bool ARMAsmParser::
  validateInstruction(MCInst &Inst,
                      const SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
-  MCInstrDesc &MCID = getInstDesc(Inst.getOpcode());
+  const MCInstrDesc &MCID = getInstDesc(Inst.getOpcode());
    SMLoc Loc = Operands[0]->getStartLoc();
    // Check the IT block state first.
    // NOTE: In Thumb mode, the BKPT instruction has the interesting property of
@@ -4362,16 +4541,21 @@ validateInstruction(MCInst &Inst,
                     "in register list");
      break;
    }
+  // Like for ldm/stm, push and pop have hi-reg handling version in Thumb2,
+  // so only issue a diagnostic for thumb1. The instructions will be
+  // switched to the t2 encodings in processInstruction() if necessary.
    case ARM::tPOP: {
      bool listContainsBase;
-    if (checkLowRegisterList(Inst, 3, 0, ARM::PC, listContainsBase))
+    if (checkLowRegisterList(Inst, 2, 0, ARM::PC, listContainsBase) &&
+        !isThumbTwo())
        return Error(Operands[2]->getStartLoc(),
                     "registers must be in range r0-r7 or pc");
      break;
    }
    case ARM::tPUSH: {
      bool listContainsBase;
-    if (checkLowRegisterList(Inst, 3, 0, ARM::LR, listContainsBase))
+    if (checkLowRegisterList(Inst, 2, 0, ARM::LR, listContainsBase) &&
+        !isThumbTwo())
        return Error(Operands[2]->getStartLoc(),
                     "registers must be in range r0-r7 or lr");
      break;
@@ -4388,10 +4572,71 @@ validateInstruction(MCInst &Inst,
    return false;
  }
  
-void ARMAsmParser::
+bool ARMAsmParser::
  processInstruction(MCInst &Inst,
                     const SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    switch (Inst.getOpcode()) {
+  // Handle the MOV complex aliases.
+  case ARM::ASRi:
+  case ARM::LSRi:
+  case ARM::LSLi:
+  case ARM::RORi: {
+    ARM_AM::ShiftOpc ShiftTy;
+    unsigned Amt = Inst.getOperand(2).getImm();
+    switch(Inst.getOpcode()) {
+    default: llvm_unreachable("unexpected opcode!");
+    case ARM::ASRi: ShiftTy = ARM_AM::asr; break;
+    case ARM::LSRi: ShiftTy = ARM_AM::lsr; break;
+    case ARM::LSLi: ShiftTy = ARM_AM::lsl; break;
+    case ARM::RORi: ShiftTy = ARM_AM::ror; break;
+    }
+    // A shift by zero is a plain MOVr, not a MOVsi.
+    unsigned Opc = Amt == 0 ? ARM::MOVr : ARM::MOVsi;
+    unsigned Shifter = ARM_AM::getSORegOpc(ShiftTy, Amt);
+    MCInst TmpInst;
+    TmpInst.setOpcode(Opc);
+    TmpInst.addOperand(Inst.getOperand(0)); // Rd
+    TmpInst.addOperand(Inst.getOperand(1)); // Rn
+    if (Opc == ARM::MOVsi)
+      TmpInst.addOperand(MCOperand::CreateImm(Shifter)); // Shift value and ty
+    TmpInst.addOperand(Inst.getOperand(3)); // CondCode
+    TmpInst.addOperand(Inst.getOperand(4));
+    TmpInst.addOperand(Inst.getOperand(5)); // cc_out
+    Inst = TmpInst;
+    return true;
+  }
+  case ARM::t2LDMIA_UPD: {
+    // If this is a load of a single register, then we should use
+    // a post-indexed LDR instruction instead, per the ARM ARM.
+    if (Inst.getNumOperands() != 5)
+      return false;
+    MCInst TmpInst;
+    TmpInst.setOpcode(ARM::t2LDR_POST);
+    TmpInst.addOperand(Inst.getOperand(4)); // Rt
+    TmpInst.addOperand(Inst.getOperand(0)); // Rn_wb
+    TmpInst.addOperand(Inst.getOperand(1)); // Rn
+    TmpInst.addOperand(MCOperand::CreateImm(4));
+    TmpInst.addOperand(Inst.getOperand(2)); // CondCode
+    TmpInst.addOperand(Inst.getOperand(3));
+    Inst = TmpInst;
+    return true;
+  }
+  case ARM::t2STMDB_UPD: {
+    // If this is a store of a single register, then we should use
+    // a pre-indexed STR instruction instead, per the ARM ARM.
+    if (Inst.getNumOperands() != 5)
+      return false;
+    MCInst TmpInst;
+    TmpInst.setOpcode(ARM::t2STR_PRE);
+    TmpInst.addOperand(Inst.getOperand(0)); // Rn_wb
+    TmpInst.addOperand(Inst.getOperand(4)); // Rt
+    TmpInst.addOperand(Inst.getOperand(1)); // Rn
+    TmpInst.addOperand(MCOperand::CreateImm(-4));
+    TmpInst.addOperand(Inst.getOperand(2)); // CondCode
+    TmpInst.addOperand(Inst.getOperand(3));
+    Inst = TmpInst;
+    return true;
+  }
    case ARM::LDMIA_UPD:
      // If this is a load of a single register via a 'pop', then we should use
      // a post-indexed LDR instruction instead, per the ARM ARM.
@@ -4407,6 +4652,7 @@ processInstruction(MCInst &Inst,
        TmpInst.addOperand(Inst.getOperand(2)); // CondCode
        TmpInst.addOperand(Inst.getOperand(3));
        Inst = TmpInst;
+      return true;
      }
      break;
    case ARM::STMDB_UPD:
@@ -4430,36 +4676,48 @@ processInstruction(MCInst &Inst,
      // explicitly specified. From the ARM ARM: "Encoding T1 is preferred
      // to encoding T2 if <Rd> is specified and encoding T2 is preferred
      // to encoding T1 if <Rd> is omitted."
-    if (Inst.getOperand(3).getImm() < 8 && Operands.size() == 6)
+    if (Inst.getOperand(3).getImm() < 8 && Operands.size() == 6) {
        Inst.setOpcode(ARM::tADDi3);
+      return true;
+    }
      break;
    case ARM::tSUBi8:
      // If the immediate is in the range 0-7, we want tADDi3 iff Rd was
      // explicitly specified. From the ARM ARM: "Encoding T1 is preferred
      // to encoding T2 if <Rd> is specified and encoding T2 is preferred
      // to encoding T1 if <Rd> is omitted."
-    if (Inst.getOperand(3).getImm() < 8 && Operands.size() == 6)
+    if (Inst.getOperand(3).getImm() < 8 && Operands.size() == 6) {
        Inst.setOpcode(ARM::tSUBi3);
+      return true;
+    }
      break;
    case ARM::tB:
      // A Thumb conditional branch outside of an IT block is a tBcc.
-    if (Inst.getOperand(1).getImm() != ARMCC::AL && !inITBlock())
+    if (Inst.getOperand(1).getImm() != ARMCC::AL && !inITBlock()) {
        Inst.setOpcode(ARM::tBcc);
+      return true;
+    }
      break;
    case ARM::t2B:
      // A Thumb2 conditional branch outside of an IT block is a t2Bcc.
-    if (Inst.getOperand(1).getImm() != ARMCC::AL && !inITBlock())
+    if (Inst.getOperand(1).getImm() != ARMCC::AL && !inITBlock()){
        Inst.setOpcode(ARM::t2Bcc);
+      return true;
+    }
      break;
    case ARM::t2Bcc:
      // If the conditional is AL or we're in an IT block, we really want t2B.
-    if (Inst.getOperand(1).getImm() == ARMCC::AL || inITBlock())
+    if (Inst.getOperand(1).getImm() == ARMCC::AL || inITBlock()) {
        Inst.setOpcode(ARM::t2B);
+      return true;
+    }
      break;
    case ARM::tBcc:
      // If the conditional is AL, we really want tB.
-    if (Inst.getOperand(1).getImm() == ARMCC::AL)
+    if (Inst.getOperand(1).getImm() == ARMCC::AL) {
        Inst.setOpcode(ARM::tB);
+      return true;
+    }
      break;
    case ARM::tLDMIA: {
      // If the register list contains any high registers, or if the writeback
@@ -4482,6 +4740,7 @@ processInstruction(MCInst &Inst,
        if (hasWritebackToken)
          Inst.insert(Inst.begin(),
                      MCOperand::CreateReg(Inst.getOperand(0).getReg()));
+      return true;
      }
      break;
    }
@@ -4495,9 +4754,35 @@ processInstruction(MCInst &Inst,
        // 16-bit encoding isn't sufficient. Switch to the 32-bit version.
        assert (isThumbTwo());
        Inst.setOpcode(ARM::t2STMIA_UPD);
+      return true;
      }
      break;
    }
+  case ARM::tPOP: {
+    bool listContainsBase;
+    // If the register list contains any high registers, we need to use
+    // the 32-bit encoding instead if we're in Thumb2. Otherwise, this
+    // should have generated an error in validateInstruction().
+    if (!checkLowRegisterList(Inst, 2, 0, ARM::PC, listContainsBase))
+      return false;
+    assert (isThumbTwo());
+    Inst.setOpcode(ARM::t2LDMIA_UPD);
+    // Add the base register and writeback operands.
+    Inst.insert(Inst.begin(), MCOperand::CreateReg(ARM::SP));
+    Inst.insert(Inst.begin(), MCOperand::CreateReg(ARM::SP));
+    return true;
+  }
+  case ARM::tPUSH: {
+    bool listContainsBase;
+    if (!checkLowRegisterList(Inst, 2, 0, ARM::LR, listContainsBase))
+      return false;
+    assert (isThumbTwo());
+    Inst.setOpcode(ARM::t2STMDB_UPD);
+    // Add the base register and writeback operands.
+    Inst.insert(Inst.begin(), MCOperand::CreateReg(ARM::SP));
+    Inst.insert(Inst.begin(), MCOperand::CreateReg(ARM::SP));
+    return true;
+  }
    case ARM::t2MOVi: {
      // If we can use the 16-bit encoding and the user didn't explicitly
      // request the 32-bit variant, transform it here.
@@ -4517,6 +4802,7 @@ processInstruction(MCInst &Inst,
        TmpInst.addOperand(Inst.getOperand(2));
        TmpInst.addOperand(Inst.getOperand(3));
        Inst = TmpInst;
+      return true;
      }
      break;
    }
@@ -4537,6 +4823,7 @@ processInstruction(MCInst &Inst,
        TmpInst.addOperand(Inst.getOperand(2));
        TmpInst.addOperand(Inst.getOperand(3));
        Inst = TmpInst;
+      return true;
      }
      break;
    }
@@ -4567,6 +4854,7 @@ processInstruction(MCInst &Inst,
        TmpInst.addOperand(Inst.getOperand(3));
        TmpInst.addOperand(Inst.getOperand(4));
        Inst = TmpInst;
+      return true;
      }
      break;
    }
@@ -4599,13 +4887,14 @@ processInstruction(MCInst &Inst,
      break;
    }
    }
+  return false;
  }
  
  unsigned ARMAsmParser::checkTargetMatchPredicate(MCInst &Inst) {
    // 16-bit thumb arithmetic instructions either require or preclude the 'S'
    // suffix depending on whether they're in an IT block or not.
    unsigned Opc = Inst.getOpcode();
-  MCInstrDesc &MCID = getInstDesc(Opc);
+  const MCInstrDesc &MCID = getInstDesc(Opc);
    if (MCID.TSFlags & ARMII::ThumbArithFlagSetting) {
      assert(MCID.hasOptionalDef() &&
             "optionally flag setting instruction missing optional def operand");
@@ -4664,8 +4953,11 @@ MatchAndEmitInstruction(SMLoc IDLoc,
      }
  
      // Some instructions need post-processing to, for example, tweak which
-    // encoding is selected.
-    processInstruction(Inst, Operands);
+    // encoding is selected. Loop on it while changes happen so the
+    // individual transformations can chain off each other. E.g.,
+    // tPOP(r8)->t2LDMIA_UPD(sp,r8)->t2STR_POST(sp,r8)
+    while (processInstruction(Inst, Operands))
+      ;
  
      // Only move forward at the very end so that everything in validate
      // and process gets a consistent answer about whether we're in an IT
@@ -4775,17 +5067,17 @@ bool ARMAsmParser::parseDirectiveThumbFunc(SMLoc L) {
      const AsmToken &Tok = Parser.getTok();
      if (Tok.isNot(AsmToken::Identifier) && Tok.isNot(AsmToken::String))
        return Error(L, "unexpected token in .thumb_func directive");
-    Name = Tok.getString();
+    Name = Tok.getIdentifier();
      Parser.Lex(); // Consume the identifier token.
    }
  
-  if (getLexer().isNot(AsmToken::EndOfStatement))
+ if (getLexer().isNot(AsmToken::EndOfStatement))
      return Error(L, "unexpected token in directive");
    Parser.Lex();
  
    // FIXME: assuming function name will be the line following .thumb_func
    if (!isMachO) {
-    Name = Parser.getTok().getString();
+    Name = Parser.getTok().getIdentifier();
    }
  
    // Mark symbol as a thumb symbol.