ARM enclosing curly braces optional on one-register VLD/VST instruction lists.

[oota-llvm.git] / lib / Target / ARM / AsmParser / ARMAsmParser.cpp
diff --git a/lib/Target/ARM/AsmParser/ARMAsmParser.cpp b/lib/Target/ARM/AsmParser/ARMAsmParser.cpp

index e68ecec301a2fdbc7129b402108f3b6fc3315a82..1535a7a77683c68b1a7f68a1be69e9d29089955b 100644 (file)
--- a/lib/Target/ARM/AsmParser/ARMAsmParser.cpp
+++ b/lib/Target/ARM/AsmParser/ARMAsmParser.cpp
@@ -208,7 +208,7 @@ class ARMAsmParser : public MCTargetAsmParser {
  
    bool validateInstruction(MCInst &Inst,
                             const SmallVectorImpl<MCParsedAsmOperand*> &Ops);
-  void processInstruction(MCInst &Inst,
+  bool processInstruction(MCInst &Inst,
                            const SmallVectorImpl<MCParsedAsmOperand*> &Ops);
    bool shouldOmitCCOutOperand(StringRef Mnemonic,
                                SmallVectorImpl<MCParsedAsmOperand*> &Operands);
@@ -602,6 +602,14 @@ public:
      int64_t Value = CE->getValue();
      return Value > 0 && Value < 33;
    }
+  bool isImm0_32() const {
+    if (Kind != k_Immediate)
+      return false;
+    const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(getImm());
+    if (!CE) return false;
+    int64_t Value = CE->getValue();
+    return Value >= 0 && Value < 33;
+  }
    bool isImm0_65535() const {
      if (Kind != k_Immediate)
        return false;
@@ -706,7 +714,7 @@ public:
    bool isBitfield() const { return Kind == k_BitfieldDescriptor; }
    bool isPostIdxRegShifted() const { return Kind == k_PostIndexRegister; }
    bool isPostIdxReg() const {
-    return Kind == k_PostIndexRegister && PostIdxReg.ShiftTy == ARM_AM::no_shift;
+    return Kind == k_PostIndexRegister && PostIdxReg.ShiftTy ==ARM_AM::no_shift;
    }
    bool isMemNoOffset(bool alignOK = false) const {
      if (!isMemory())
@@ -1093,7 +1101,8 @@ public:
  
    void addRegShiftedRegOperands(MCInst &Inst, unsigned N) const {
      assert(N == 3 && "Invalid number of operands!");
-    assert(isRegShiftedReg() && "addRegShiftedRegOperands() on non RegShiftedReg!");
+    assert(isRegShiftedReg() &&
+           "addRegShiftedRegOperands() on non RegShiftedReg!");
      Inst.addOperand(MCOperand::CreateReg(RegShiftedReg.SrcReg));
      Inst.addOperand(MCOperand::CreateReg(RegShiftedReg.ShiftReg));
      Inst.addOperand(MCOperand::CreateImm(
@@ -1102,7 +1111,8 @@ public:
  
    void addRegShiftedImmOperands(MCInst &Inst, unsigned N) const {
      assert(N == 2 && "Invalid number of operands!");
-    assert(isRegShiftedImm() && "addRegShiftedImmOperands() on non RegShiftedImm!");
+    assert(isRegShiftedImm() &&
+           "addRegShiftedImmOperands() on non RegShiftedImm!");
      Inst.addOperand(MCOperand::CreateReg(RegShiftedImm.SrcReg));
      Inst.addOperand(MCOperand::CreateImm(
        ARM_AM::getSORegOpc(RegShiftedImm.ShiftTy, RegShiftedImm.ShiftImm)));
@@ -1181,26 +1191,6 @@ public:
      Inst.addOperand(MCOperand::CreateImm(CE->getValue() / 4));
    }
  
-  void addImm0_255Operands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
-  void addImm0_7Operands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
-  void addImm0_15Operands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
-  void addImm0_31Operands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
    void addImm1_16Operands(MCInst &Inst, unsigned N) const {
      assert(N == 1 && "Invalid number of operands!");
      // The constant encodes as the immediate-1, and we store in the instruction
@@ -1217,21 +1207,6 @@ public:
      Inst.addOperand(MCOperand::CreateImm(CE->getValue() - 1));
    }
  
-  void addImm0_65535Operands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
-  void addImm0_65535ExprOperands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
-  void addImm24bitOperands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
    void addImmThumbSROperands(MCInst &Inst, unsigned N) const {
      assert(N == 1 && "Invalid number of operands!");
      // The constant encodes as the immediate, except for 32, which encodes as
@@ -1241,11 +1216,6 @@ public:
      Inst.addOperand(MCOperand::CreateImm((Imm == 32 ? 0 : Imm)));
    }
  
-  void addPKHLSLImmOperands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
    void addPKHASRImmOperands(MCInst &Inst, unsigned N) const {
      assert(N == 1 && "Invalid number of operands!");
      // An ASR value of 32 encodes as 0, so that's how we want to add it to
@@ -1255,16 +1225,6 @@ public:
      Inst.addOperand(MCOperand::CreateImm(Val == 32 ? 0 : Val));
    }
  
-  void addARMSOImmOperands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
-  void addT2SOImmOperands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
    void addT2SOImmNotOperands(MCInst &Inst, unsigned N) const {
      assert(N == 1 && "Invalid number of operands!");
      // The operand is actually a t2_so_imm, but we have its bitwise
@@ -1281,11 +1241,6 @@ public:
      Inst.addOperand(MCOperand::CreateImm(~CE->getValue()));
    }
  
-  void addSetEndImmOperands(MCInst &Inst, unsigned N) const {
-    assert(N == 1 && "Invalid number of operands!");
-    addExpr(Inst, getImm());
-  }
-
    void addMemBarrierOptOperands(MCInst &Inst, unsigned N) const {
      assert(N == 1 && "Invalid number of operands!");
      Inst.addOperand(MCOperand::CreateImm(unsigned(getMemBarrierOpt())));
@@ -1473,8 +1428,9 @@ public:
  
    void addMemRegOffsetOperands(MCInst &Inst, unsigned N) const {
      assert(N == 3 && "Invalid number of operands!");
-    unsigned Val = ARM_AM::getAM2Opc(Memory.isNegative ? ARM_AM::sub : ARM_AM::add,
-                                     Memory.ShiftImm, Memory.ShiftType);
+    unsigned Val =
+      ARM_AM::getAM2Opc(Memory.isNegative ? ARM_AM::sub : ARM_AM::add,
+                        Memory.ShiftImm, Memory.ShiftType);
      Inst.addOperand(MCOperand::CreateReg(Memory.BaseRegNum));
      Inst.addOperand(MCOperand::CreateReg(Memory.OffsetRegNum));
      Inst.addOperand(MCOperand::CreateImm(Val));
@@ -2397,6 +2353,29 @@ static unsigned getNextRegister(unsigned Reg) {
    }
  }
  
+// Return the low-subreg of a given Q register.
+static unsigned getDRegFromQReg(unsigned QReg) {
+  switch (QReg) {
+  default: llvm_unreachable("expected a Q register!");
+  case ARM::Q0:  return ARM::D0;
+  case ARM::Q1:  return ARM::D2;
+  case ARM::Q2:  return ARM::D4;
+  case ARM::Q3:  return ARM::D6;
+  case ARM::Q4:  return ARM::D8;
+  case ARM::Q5:  return ARM::D10;
+  case ARM::Q6:  return ARM::D12;
+  case ARM::Q7:  return ARM::D14;
+  case ARM::Q8:  return ARM::D16;
+  case ARM::Q9:  return ARM::D18;
+  case ARM::Q10: return ARM::D20;
+  case ARM::Q11: return ARM::D22;
+  case ARM::Q12: return ARM::D24;
+  case ARM::Q13: return ARM::D26;
+  case ARM::Q14: return ARM::D28;
+  case ARM::Q15: return ARM::D30;
+  }
+}
+
  /// Parse a register list.
  bool ARMAsmParser::
  parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
@@ -2412,6 +2391,16 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    if (Reg == -1)
      return Error(RegLoc, "register expected");
  
+  // The reglist instructions have at most 16 registers, so reserve
+  // space for that many.
+  SmallVector<std::pair<unsigned, SMLoc>, 16> Registers;
+
+  // Allow Q regs and just interpret them as the two D sub-registers.
+  if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(Reg)) {
+    Reg = getDRegFromQReg(Reg);
+    Registers.push_back(std::pair<unsigned, SMLoc>(Reg, RegLoc));
+    ++Reg;
+  }
    const MCRegisterClass *RC;
    if (ARMMCRegisterClasses[ARM::GPRRegClassID].contains(Reg))
      RC = &ARMMCRegisterClasses[ARM::GPRRegClassID];
@@ -2422,10 +2411,7 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    else
      return Error(RegLoc, "invalid register in register list");
  
-  // The reglist instructions have at most 16 registers, so reserve
-  // space for that many.
-  SmallVector<std::pair<unsigned, SMLoc>, 16> Registers;
-  // Store the first register.
+  // Store the register.
    Registers.push_back(std::pair<unsigned, SMLoc>(Reg, RegLoc));
  
    // This starts immediately after the first register token in the list,
@@ -2439,6 +2425,9 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
        int EndReg = tryParseRegister();
        if (EndReg == -1)
          return Error(EndLoc, "register expected");
+      // Allow Q regs and just interpret them as the two D sub-registers.
+      if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(EndReg))
+        EndReg = getDRegFromQReg(EndReg) + 1;
        // If the register is the same as the start reg, there's nothing
        // more to do.
        if (Reg == EndReg)
@@ -2463,6 +2452,12 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
      Reg = tryParseRegister();
      if (Reg == -1)
        return Error(RegLoc, "register expected");
+    // Allow Q regs and just interpret them as the two D sub-registers.
+    bool isQReg = false;
+    if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(Reg)) {
+      Reg = getDRegFromQReg(Reg);
+      isQReg = true;
+    }
      // The register must be in the same register class as the first.
      if (!RC->contains(Reg))
        return Error(RegLoc, "invalid register in register list");
@@ -2476,6 +2471,8 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
          Reg != OldReg + 1)
        return Error(RegLoc, "non-contiguous register range");
      Registers.push_back(std::pair<unsigned, SMLoc>(Reg, RegLoc));
+    if (isQReg)
+      Registers.push_back(std::pair<unsigned, SMLoc>(++Reg, RegLoc));
    }
  
    SMLoc E = Parser.getTok().getLoc();
@@ -2487,36 +2484,34 @@ parseRegisterList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    return false;
  }
  
-// Return the low-subreg of a given Q register.
-static unsigned getDRegFromQReg(unsigned QReg) {
-  switch (QReg) {
-  default: llvm_unreachable("expected a Q register!");
-  case ARM::Q0:  return ARM::D0;
-  case ARM::Q1:  return ARM::D2;
-  case ARM::Q2:  return ARM::D4;
-  case ARM::Q3:  return ARM::D6;
-  case ARM::Q4:  return ARM::D8;
-  case ARM::Q5:  return ARM::D10;
-  case ARM::Q6:  return ARM::D12;
-  case ARM::Q7:  return ARM::D14;
-  case ARM::Q8:  return ARM::D16;
-  case ARM::Q9:  return ARM::D19;
-  case ARM::Q10: return ARM::D20;
-  case ARM::Q11: return ARM::D22;
-  case ARM::Q12: return ARM::D24;
-  case ARM::Q13: return ARM::D26;
-  case ARM::Q14: return ARM::D28;
-  case ARM::Q15: return ARM::D30;
-  }
-}
-
  // parse a vector register list
  ARMAsmParser::OperandMatchResultTy ARMAsmParser::
  parseVectorList(SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
-  if(Parser.getTok().isNot(AsmToken::LCurly))
+  SMLoc S = Parser.getTok().getLoc();
+  // As an extension (to match gas), support a plain D register or Q register
+  // (without encosing curly braces) as a single or double entry list,
+  // respectively.
+  if (Parser.getTok().is(AsmToken::Identifier)) {
+    int Reg = tryParseRegister();
+    if (Reg == -1)
+      return MatchOperand_NoMatch;
+    SMLoc E = Parser.getTok().getLoc();
+    if (ARMMCRegisterClasses[ARM::DPRRegClassID].contains(Reg)) {
+      Operands.push_back(ARMOperand::CreateVectorList(Reg, 1, S, E));
+      return MatchOperand_Success;
+    }
+    if (ARMMCRegisterClasses[ARM::QPRRegClassID].contains(Reg)) {
+      Reg = getDRegFromQReg(Reg);
+      Operands.push_back(ARMOperand::CreateVectorList(Reg, 2, S, E));
+      return MatchOperand_Success;
+    }
+    Error(S, "vector register expected");
+    return MatchOperand_ParseFail;
+  }
+
+  if (Parser.getTok().isNot(AsmToken::LCurly))
      return MatchOperand_NoMatch;
  
-  SMLoc S = Parser.getTok().getLoc();
    Parser.Lex(); // Eat '{' token.
    SMLoc RegLoc = Parser.getTok().getLoc();
  
@@ -3402,13 +3397,15 @@ cvtThumbMultiply(MCInst &Inst, unsigned Opcode,
    }
    ((ARMOperand*)Operands[3])->addRegOperands(Inst, 1);
    ((ARMOperand*)Operands[1])->addCCOutOperands(Inst, 1);
-  ((ARMOperand*)Operands[4])->addRegOperands(Inst, 1);
-  // If we have a three-operand form, use that, else the second source operand
-  // is just the destination operand again.
-  if (Operands.size() == 6)
-    ((ARMOperand*)Operands[5])->addRegOperands(Inst, 1);
-  else
-    Inst.addOperand(Inst.getOperand(0));
+  // If we have a three-operand form, make sure to set Rn to be the operand
+  // that isn't the same as Rd.
+  unsigned RegOp = 4;
+  if (Operands.size() == 6 &&
+      ((ARMOperand*)Operands[4])->getReg() ==
+        ((ARMOperand*)Operands[3])->getReg())
+    RegOp = 5;
+  ((ARMOperand*)Operands[RegOp])->addRegOperands(Inst, 1);
+  Inst.addOperand(Inst.getOperand(0));
    ((ARMOperand*)Operands[2])->addCondCodeOperands(Inst, 2);
  
    return true;
@@ -4122,6 +4119,7 @@ bool ARMAsmParser::shouldOmitCCOutOperand(StringRef Mnemonic,
        // remove the cc_out operand.
        (!isARMLowRegister(static_cast<ARMOperand*>(Operands[3])->getReg()) ||
         !isARMLowRegister(static_cast<ARMOperand*>(Operands[4])->getReg()) ||
+       !isARMLowRegister(static_cast<ARMOperand*>(Operands[5])->getReg()) ||
         !inITBlock() ||
         (static_cast<ARMOperand*>(Operands[3])->getReg() !=
          static_cast<ARMOperand*>(Operands[5])->getReg() &&
@@ -4129,6 +4127,20 @@ bool ARMAsmParser::shouldOmitCCOutOperand(StringRef Mnemonic,
          static_cast<ARMOperand*>(Operands[4])->getReg())))
      return true;
  
+  // Also check the 'mul' syntax variant that doesn't specify an explicit
+  // destination register.
+  if (isThumbTwo() && Mnemonic == "mul" && Operands.size() == 5 &&
+      static_cast<ARMOperand*>(Operands[1])->getReg() == 0 &&
+      static_cast<ARMOperand*>(Operands[3])->isReg() &&
+      static_cast<ARMOperand*>(Operands[4])->isReg() &&
+      // If the registers aren't low regs  or the cc_out operand is zero
+      // outside of an IT block, we have to use the 32-bit encoding, so
+      // remove the cc_out operand.
+      (!isARMLowRegister(static_cast<ARMOperand*>(Operands[3])->getReg()) ||
+       !isARMLowRegister(static_cast<ARMOperand*>(Operands[4])->getReg()) ||
+       !inITBlock()))
+    return true;
+
  
  
    // Register-register 'add/sub' for thumb does not have a cc_out operand
@@ -4146,6 +4158,22 @@ bool ARMAsmParser::shouldOmitCCOutOperand(StringRef Mnemonic,
    return false;
  }
  
+static bool isDataTypeToken(StringRef Tok) {
+  return Tok == ".8" || Tok == ".16" || Tok == ".32" || Tok == ".64" ||
+    Tok == ".i8" || Tok == ".i16" || Tok == ".i32" || Tok == ".i64" ||
+    Tok == ".u8" || Tok == ".u16" || Tok == ".u32" || Tok == ".u64" ||
+    Tok == ".s8" || Tok == ".s16" || Tok == ".s32" || Tok == ".s64" ||
+    Tok == ".p8" || Tok == ".p16" || Tok == ".f32" || Tok == ".f64" ||
+    Tok == ".f" || Tok == ".d";
+}
+
+// FIXME: This bit should probably be handled via an explicit match class
+// in the .td files that matches the suffix instead of having it be
+// a literal string token the way it is now.
+static bool doesIgnoreDataTypeSuffix(StringRef Mnemonic, StringRef DT) {
+  return Mnemonic.startswith("vldm") || Mnemonic.startswith("vstm");
+}
+
  /// Parse an arm instruction mnemonic followed by its operands.
  bool ARMAsmParser::ParseInstruction(StringRef Name, SMLoc NameLoc,
                                 SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
@@ -4250,9 +4278,12 @@ bool ARMAsmParser::ParseInstruction(StringRef Name, SMLoc NameLoc,
      Next = Name.find('.', Start + 1);
      StringRef ExtraToken = Name.slice(Start, Next);
  
-    // For now, we're only parsing Thumb1 (for the most part), so
-    // just ignore ".n" qualifiers. We'll use them to restrict
-    // matching when we do Thumb2.
+    // Some NEON instructions have an optional datatype suffix that is
+    // completely ignored. Check for that.
+    if (isDataTypeToken(ExtraToken) &&
+        doesIgnoreDataTypeSuffix(Mnemonic, ExtraToken))
+      continue;
+
      if (ExtraToken != ".n") {
        SMLoc Loc = SMLoc::getFromPointer(NameLoc.getPointer() + Start);
        Operands.push_back(ARMOperand::CreateToken(ExtraToken, Loc));
@@ -4511,16 +4542,21 @@ validateInstruction(MCInst &Inst,
                     "in register list");
      break;
    }
+  // Like for ldm/stm, push and pop have hi-reg handling version in Thumb2,
+  // so only issue a diagnostic for thumb1. The instructions will be
+  // switched to the t2 encodings in processInstruction() if necessary.
    case ARM::tPOP: {
      bool listContainsBase;
-    if (checkLowRegisterList(Inst, 3, 0, ARM::PC, listContainsBase))
+    if (checkLowRegisterList(Inst, 2, 0, ARM::PC, listContainsBase) &&
+        !isThumbTwo())
        return Error(Operands[2]->getStartLoc(),
                     "registers must be in range r0-r7 or pc");
      break;
    }
    case ARM::tPUSH: {
      bool listContainsBase;
-    if (checkLowRegisterList(Inst, 3, 0, ARM::LR, listContainsBase))
+    if (checkLowRegisterList(Inst, 2, 0, ARM::LR, listContainsBase) &&
+        !isThumbTwo())
        return Error(Operands[2]->getStartLoc(),
                     "registers must be in range r0-r7 or lr");
      break;
@@ -4537,24 +4573,70 @@ validateInstruction(MCInst &Inst,
    return false;
  }
  
-void ARMAsmParser::
+bool ARMAsmParser::
  processInstruction(MCInst &Inst,
                     const SmallVectorImpl<MCParsedAsmOperand*> &Operands) {
    switch (Inst.getOpcode()) {
    // Handle the MOV complex aliases.
-  case ARM::ASRi: {
-    unsigned Amt = Inst.getOperand(2).getImm() + 1;
-    unsigned ShiftOp = ARM_AM::getSORegOpc(ARM_AM::asr, Amt);
+  case ARM::ASRi:
+  case ARM::LSRi:
+  case ARM::LSLi:
+  case ARM::RORi: {
+    ARM_AM::ShiftOpc ShiftTy;
+    unsigned Amt = Inst.getOperand(2).getImm();
+    switch(Inst.getOpcode()) {
+    default: llvm_unreachable("unexpected opcode!");
+    case ARM::ASRi: ShiftTy = ARM_AM::asr; break;
+    case ARM::LSRi: ShiftTy = ARM_AM::lsr; break;
+    case ARM::LSLi: ShiftTy = ARM_AM::lsl; break;
+    case ARM::RORi: ShiftTy = ARM_AM::ror; break;
+    }
+    // A shift by zero is a plain MOVr, not a MOVsi.
+    unsigned Opc = Amt == 0 ? ARM::MOVr : ARM::MOVsi;
+    unsigned Shifter = ARM_AM::getSORegOpc(ShiftTy, Amt);
      MCInst TmpInst;
-    TmpInst.setOpcode(ARM::MOVsi);
+    TmpInst.setOpcode(Opc);
      TmpInst.addOperand(Inst.getOperand(0)); // Rd
      TmpInst.addOperand(Inst.getOperand(1)); // Rn
-    TmpInst.addOperand(MCOperand::CreateImm(ShiftOp)); // Shift value and ty
+    if (Opc == ARM::MOVsi)
+      TmpInst.addOperand(MCOperand::CreateImm(Shifter)); // Shift value and ty
      TmpInst.addOperand(Inst.getOperand(3)); // CondCode
      TmpInst.addOperand(Inst.getOperand(4));
      TmpInst.addOperand(Inst.getOperand(5)); // cc_out
      Inst = TmpInst;
-    break;
+    return true;
+  }
+  case ARM::t2LDMIA_UPD: {
+    // If this is a load of a single register, then we should use
+    // a post-indexed LDR instruction instead, per the ARM ARM.
+    if (Inst.getNumOperands() != 5)
+      return false;
+    MCInst TmpInst;
+    TmpInst.setOpcode(ARM::t2LDR_POST);
+    TmpInst.addOperand(Inst.getOperand(4)); // Rt
+    TmpInst.addOperand(Inst.getOperand(0)); // Rn_wb
+    TmpInst.addOperand(Inst.getOperand(1)); // Rn
+    TmpInst.addOperand(MCOperand::CreateImm(4));
+    TmpInst.addOperand(Inst.getOperand(2)); // CondCode
+    TmpInst.addOperand(Inst.getOperand(3));
+    Inst = TmpInst;
+    return true;
+  }
+  case ARM::t2STMDB_UPD: {
+    // If this is a store of a single register, then we should use
+    // a pre-indexed STR instruction instead, per the ARM ARM.
+    if (Inst.getNumOperands() != 5)
+      return false;
+    MCInst TmpInst;
+    TmpInst.setOpcode(ARM::t2STR_PRE);
+    TmpInst.addOperand(Inst.getOperand(0)); // Rn_wb
+    TmpInst.addOperand(Inst.getOperand(4)); // Rt
+    TmpInst.addOperand(Inst.getOperand(1)); // Rn
+    TmpInst.addOperand(MCOperand::CreateImm(-4));
+    TmpInst.addOperand(Inst.getOperand(2)); // CondCode
+    TmpInst.addOperand(Inst.getOperand(3));
+    Inst = TmpInst;
+    return true;
    }
    case ARM::LDMIA_UPD:
      // If this is a load of a single register via a 'pop', then we should use
@@ -4571,6 +4653,7 @@ processInstruction(MCInst &Inst,
        TmpInst.addOperand(Inst.getOperand(2)); // CondCode
        TmpInst.addOperand(Inst.getOperand(3));
        Inst = TmpInst;
+      return true;
      }
      break;
    case ARM::STMDB_UPD:
@@ -4594,36 +4677,48 @@ processInstruction(MCInst &Inst,
      // explicitly specified. From the ARM ARM: "Encoding T1 is preferred
      // to encoding T2 if <Rd> is specified and encoding T2 is preferred
      // to encoding T1 if <Rd> is omitted."
-    if (Inst.getOperand(3).getImm() < 8 && Operands.size() == 6)
+    if (Inst.getOperand(3).getImm() < 8 && Operands.size() == 6) {
        Inst.setOpcode(ARM::tADDi3);
+      return true;
+    }
      break;
    case ARM::tSUBi8:
      // If the immediate is in the range 0-7, we want tADDi3 iff Rd was
      // explicitly specified. From the ARM ARM: "Encoding T1 is preferred
      // to encoding T2 if <Rd> is specified and encoding T2 is preferred
      // to encoding T1 if <Rd> is omitted."
-    if (Inst.getOperand(3).getImm() < 8 && Operands.size() == 6)
+    if (Inst.getOperand(3).getImm() < 8 && Operands.size() == 6) {
        Inst.setOpcode(ARM::tSUBi3);
+      return true;
+    }
      break;
    case ARM::tB:
      // A Thumb conditional branch outside of an IT block is a tBcc.
-    if (Inst.getOperand(1).getImm() != ARMCC::AL && !inITBlock())
+    if (Inst.getOperand(1).getImm() != ARMCC::AL && !inITBlock()) {
        Inst.setOpcode(ARM::tBcc);
+      return true;
+    }
      break;
    case ARM::t2B:
      // A Thumb2 conditional branch outside of an IT block is a t2Bcc.
-    if (Inst.getOperand(1).getImm() != ARMCC::AL && !inITBlock())
+    if (Inst.getOperand(1).getImm() != ARMCC::AL && !inITBlock()){
        Inst.setOpcode(ARM::t2Bcc);
+      return true;
+    }
      break;
    case ARM::t2Bcc:
      // If the conditional is AL or we're in an IT block, we really want t2B.
-    if (Inst.getOperand(1).getImm() == ARMCC::AL || inITBlock())
+    if (Inst.getOperand(1).getImm() == ARMCC::AL || inITBlock()) {
        Inst.setOpcode(ARM::t2B);
+      return true;
+    }
      break;
    case ARM::tBcc:
      // If the conditional is AL, we really want tB.
-    if (Inst.getOperand(1).getImm() == ARMCC::AL)
+    if (Inst.getOperand(1).getImm() == ARMCC::AL) {
        Inst.setOpcode(ARM::tB);
+      return true;
+    }
      break;
    case ARM::tLDMIA: {
      // If the register list contains any high registers, or if the writeback
@@ -4646,6 +4741,7 @@ processInstruction(MCInst &Inst,
        if (hasWritebackToken)
          Inst.insert(Inst.begin(),
                      MCOperand::CreateReg(Inst.getOperand(0).getReg()));
+      return true;
      }
      break;
    }
@@ -4659,9 +4755,35 @@ processInstruction(MCInst &Inst,
        // 16-bit encoding isn't sufficient. Switch to the 32-bit version.
        assert (isThumbTwo());
        Inst.setOpcode(ARM::t2STMIA_UPD);
+      return true;
      }
      break;
    }
+  case ARM::tPOP: {
+    bool listContainsBase;
+    // If the register list contains any high registers, we need to use
+    // the 32-bit encoding instead if we're in Thumb2. Otherwise, this
+    // should have generated an error in validateInstruction().
+    if (!checkLowRegisterList(Inst, 2, 0, ARM::PC, listContainsBase))
+      return false;
+    assert (isThumbTwo());
+    Inst.setOpcode(ARM::t2LDMIA_UPD);
+    // Add the base register and writeback operands.
+    Inst.insert(Inst.begin(), MCOperand::CreateReg(ARM::SP));
+    Inst.insert(Inst.begin(), MCOperand::CreateReg(ARM::SP));
+    return true;
+  }
+  case ARM::tPUSH: {
+    bool listContainsBase;
+    if (!checkLowRegisterList(Inst, 2, 0, ARM::LR, listContainsBase))
+      return false;
+    assert (isThumbTwo());
+    Inst.setOpcode(ARM::t2STMDB_UPD);
+    // Add the base register and writeback operands.
+    Inst.insert(Inst.begin(), MCOperand::CreateReg(ARM::SP));
+    Inst.insert(Inst.begin(), MCOperand::CreateReg(ARM::SP));
+    return true;
+  }
    case ARM::t2MOVi: {
      // If we can use the 16-bit encoding and the user didn't explicitly
      // request the 32-bit variant, transform it here.
@@ -4681,6 +4803,7 @@ processInstruction(MCInst &Inst,
        TmpInst.addOperand(Inst.getOperand(2));
        TmpInst.addOperand(Inst.getOperand(3));
        Inst = TmpInst;
+      return true;
      }
      break;
    }
@@ -4701,6 +4824,7 @@ processInstruction(MCInst &Inst,
        TmpInst.addOperand(Inst.getOperand(2));
        TmpInst.addOperand(Inst.getOperand(3));
        Inst = TmpInst;
+      return true;
      }
      break;
    }
@@ -4731,6 +4855,7 @@ processInstruction(MCInst &Inst,
        TmpInst.addOperand(Inst.getOperand(3));
        TmpInst.addOperand(Inst.getOperand(4));
        Inst = TmpInst;
+      return true;
      }
      break;
    }
@@ -4763,6 +4888,7 @@ processInstruction(MCInst &Inst,
      break;
    }
    }
+  return false;
  }
  
  unsigned ARMAsmParser::checkTargetMatchPredicate(MCInst &Inst) {
@@ -4828,8 +4954,11 @@ MatchAndEmitInstruction(SMLoc IDLoc,
      }
  
      // Some instructions need post-processing to, for example, tweak which
-    // encoding is selected.
-    processInstruction(Inst, Operands);
+    // encoding is selected. Loop on it while changes happen so the
+    // individual transformations can chain off each other. E.g.,
+    // tPOP(r8)->t2LDMIA_UPD(sp,r8)->t2STR_POST(sp,r8)
+    while (processInstruction(Inst, Operands))
+      ;
  
      // Only move forward at the very end so that everything in validate
      // and process gets a consistent answer about whether we're in an IT
@@ -4939,17 +5068,17 @@ bool ARMAsmParser::parseDirectiveThumbFunc(SMLoc L) {
      const AsmToken &Tok = Parser.getTok();
      if (Tok.isNot(AsmToken::Identifier) && Tok.isNot(AsmToken::String))
        return Error(L, "unexpected token in .thumb_func directive");
-    Name = Tok.getString();
+    Name = Tok.getIdentifier();
      Parser.Lex(); // Consume the identifier token.
    }
  
-  if (getLexer().isNot(AsmToken::EndOfStatement))
+ if (getLexer().isNot(AsmToken::EndOfStatement))
      return Error(L, "unexpected token in directive");
    Parser.Lex();
  
    // FIXME: assuming function name will be the line following .thumb_func
    if (!isMachO) {
-    Name = Parser.getTok().getString();
+    Name = Parser.getTok().getIdentifier();
    }
  
    // Mark symbol as a thumb symbol.