src/arm/disasm-arm.cc - platform/external/v8 - Git at Google

 // Copyright 2010 the V8 project authors. All rights reserved.
 // Redistribution and use in source and binary forms, with or without
 // modification, are permitted provided that the following conditions are
 // met:
 //
 //     * Redistributions of source code must retain the above copyright
 //       notice, this list of conditions and the following disclaimer.
 //     * Redistributions in binary form must reproduce the above
 //       copyright notice, this list of conditions and the following
 //       disclaimer in the documentation and/or other materials provided
 //       with the distribution.
 //     * Neither the name of Google Inc. nor the names of its
 //       contributors may be used to endorse or promote products derived
 //       from this software without specific prior written permission.
 //
 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 // A Disassembler object is used to disassemble a block of code instruction by
 // instruction. The default implementation of the NameConverter object can be
 // overridden to modify register names or to do symbol lookup on addresses.
 //
 // The example below will disassemble a block of code and print it to stdout.
 //
 //   NameConverter converter;
 //   Disassembler d(converter);
 //   for (byte* pc = begin; pc < end;) {
 //     char buffer[128];
 //     buffer[0] = '\0';
 //     byte* prev_pc = pc;
 //     pc += d.InstructionDecode(buffer, sizeof buffer, pc);
 //     printf("%p    %08x      %s\n",
 //            prev_pc, *reinterpret_cast<int32_t*>(prev_pc), buffer);
 //   }
 //
 // The Disassembler class also has a convenience method to disassemble a block
 // of code into a FILE*, meaning that the above functionality could also be
 // achieved by just calling Disassembler::Disassemble(stdout, begin, end);


 #include <assert.h>
 #include <stdio.h>
 #include <stdarg.h>
 #include <string.h>
 #ifndef WIN32
 #include <stdint.h>
 #endif

 #include "v8.h"

 #include "constants-arm.h"
 #include "disasm.h"
 #include "macro-assembler.h"
 #include "platform.h"


 namespace assembler {
 namespace arm {

 namespace v8i = v8::internal;


 //------------------------------------------------------------------------------

 // Decoder decodes and disassembles instructions into an output buffer.
 // It uses the converter to convert register names and call destinations into
 // more informative description.
 class Decoder {
  public:
   Decoder(const disasm::NameConverter& converter,
           v8::internal::Vector<char> out_buffer)
     : converter_(converter),
       out_buffer_(out_buffer),
       out_buffer_pos_(0) {
     out_buffer_[out_buffer_pos_] = '\0';
   }

   ~Decoder() {}

   // Writes one disassembled instruction into 'buffer' (0-terminated).
   // Returns the length of the disassembled machine instruction in bytes.
   int InstructionDecode(byte* instruction);

  private:
   // Bottleneck functions to print into the out_buffer.
   void PrintChar(const char ch);
   void Print(const char* str);

   // Printing of common values.
   void PrintRegister(int reg);
   void PrintSRegister(int reg);
   void PrintDRegister(int reg);
   int FormatVFPRegister(Instr* instr, const char* format);
   int FormatVFPinstruction(Instr* instr, const char* format);
   void PrintCondition(Instr* instr);
   void PrintShiftRm(Instr* instr);
   void PrintShiftImm(Instr* instr);
   void PrintPU(Instr* instr);
   void PrintSoftwareInterrupt(SoftwareInterruptCodes swi);

   // Handle formatting of instructions and their options.
   int FormatRegister(Instr* instr, const char* option);
   int FormatOption(Instr* instr, const char* option);
   void Format(Instr* instr, const char* format);
   void Unknown(Instr* instr);

   // Each of these functions decodes one particular instruction type, a 3-bit
   // field in the instruction encoding.
   // Types 0 and 1 are combined as they are largely the same except for the way
   // they interpret the shifter operand.
   void DecodeType01(Instr* instr);
   void DecodeType2(Instr* instr);
   void DecodeType3(Instr* instr);
   void DecodeType4(Instr* instr);
   void DecodeType5(Instr* instr);
   void DecodeType6(Instr* instr);
   void DecodeType7(Instr* instr);
   void DecodeUnconditional(Instr* instr);
   // For VFP support.
   void DecodeTypeVFP(Instr* instr);
   void DecodeType6CoprocessorIns(Instr* instr);


   const disasm::NameConverter& converter_;
   v8::internal::Vector<char> out_buffer_;
   int out_buffer_pos_;

   DISALLOW_COPY_AND_ASSIGN(Decoder);
 };


 // Support for assertions in the Decoder formatting functions.
 // Evaluates to true when 'string' begins with 'compare_string'. The
 // comparison covers exactly strlen(compare_string) characters, so trailing
 // text in 'string' is ignored. 'compare_string' is expanded twice.
 #define STRING_STARTS_WITH(string, compare_string) \
   (strncmp(string, compare_string, strlen(compare_string)) == 0)


 // Stores 'ch' at the current output position and advances the position by
 // one. No bounds check happens here; callers check before calling.
 void Decoder::PrintChar(const char ch) {
   out_buffer_[out_buffer_pos_] = ch;
   out_buffer_pos_++;
 }


 // Copies 'str' into the output buffer, stopping early when only the slot
 // for the terminator is left, and then 0-terminates the buffer.
 void Decoder::Print(const char* str) {
   for (const char* p = str;
        (*p != '\0') && (out_buffer_pos_ < (out_buffer_.length() - 1));
        p++) {
     PrintChar(*p);
   }
   out_buffer_[out_buffer_pos_] = 0;
 }


 // Textual suffix for each condition code, indexed by the value of the
 // condition field. The spelling follows the native disassembler (compare
 // with the output of "objdump -d <binary file>").
 static const char* cond_names[max_condition] = {
   "eq", "ne", "cs", "cc",
   "mi", "pl", "vs", "vc",
   "hi", "ls", "ge", "lt",
   "gt", "le", "", "invalid",
 };


 // Appends the condition suffix selected by the instruction's condition field.
 void Decoder::PrintCondition(Instr* instr) {
   const char* suffix = cond_names[instr->ConditionField()];
   Print(suffix);
 }


 // Appends the name that the active name converter assigns to core register
 // number 'reg'.
 void Decoder::PrintRegister(int reg) {
   const char* name = converter_.NameOfCPURegister(reg);
   Print(name);
 }

 // Appends the name of VFP S register 'reg' as reported by
 // VFPRegisters::Name().
 void Decoder::PrintSRegister(int reg) {
   const char* name = assembler::arm::VFPRegisters::Name(reg);
   Print(name);
 }

 // Appends the name of VFP D register 'reg'. The name is looked up through
 // VFPRegisters::Name() at index reg + 32.
 void Decoder::PrintDRegister(int reg) {
   const char* name = assembler::arm::VFPRegisters::Name(reg + 32);
   Print(name);
 }


 // Mnemonic for each shift kind, indexed by the value of the shift field.
 // The spelling follows the native disassembler (compare with the output of
 // "objdump -d <binary file>").
 static const char* shift_names[max_shift] = {
   "lsl",
   "lsr",
   "asr",
   "ror"
 };


 // Appends the shifted-register operand of an instruction: the Rm register
 // followed, where applicable, by the shift kind and either an immediate
 // shift amount or the Rs register. Mostly used for data processing
 // instructions.
 void Decoder::PrintShiftRm(Instr* instr) {
   const Shift shift = instr->ShiftField();
   int shift_amount = instr->ShiftAmountField();

   PrintRegister(instr->RmField());

   if (instr->RegShiftField() != 0) {
     // Shift amount is held in a register.
     const int rs = instr->RsField();
     out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                          ", %s ", shift_names[shift]);
     PrintRegister(rs);
     return;
   }

   // Shift amount is an immediate from here on.
   if (shift_amount == 0) {
     if (shift == LSL) {
       // Plain Rm, nothing more to print.
       return;
     }
     if (shift == ROR) {
       Print(", RRX");
       return;
     }
     if ((shift == LSR) || (shift == ASR)) {
       // An encoded amount of zero is printed as 32 for these shifts.
       shift_amount = 32;
     }
   }
   out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                        ", %s #%d",
                                        shift_names[shift], shift_amount);
 }


 // Appends the immediate operand of an instruction as "#<value>". The value
 // is the 8-bit immediate field rotated right by twice the rotate field.
 // Generally used for data processing instructions.
 void Decoder::PrintShiftImm(Instr* instr) {
   const int rotate = instr->RotateField() * 2;
   const uint32_t immed8 = static_cast<uint32_t>(instr->Immed8Field());
   // Rotate on an unsigned value, and skip the rotation entirely when the
   // amount is zero: shifting a 32-bit value by 32 bits is undefined, as is
   // overflowing a signed left shift.
   uint32_t rotated = immed8;
   if (rotate != 0) {
     rotated = (immed8 >> rotate) | (immed8 << (32 - rotate));
   }
   const int imm = static_cast<int>(rotated);
   out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                        "#%d", imm);
 }


 // Appends the addressing-mode suffix ("da", "ia", "db" or "ib") selected by
 // the PU field. Kept separate to keep FormatOption small.
 void Decoder::PrintPU(Instr* instr) {
   const char* suffix;
   switch (instr->PUField()) {
     case 0:
       suffix = "da";
       break;
     case 1:
       suffix = "ia";
       break;
     case 2:
       suffix = "db";
       break;
     case 3:
       suffix = "ib";
       break;
     default:
       UNREACHABLE();
       return;
   }
   Print(suffix);
 }


 // Appends a software interrupt code: the two known codes are printed by
 // name, anything else as a decimal number. Kept separate to keep
 // FormatOption small.
 void Decoder::PrintSoftwareInterrupt(SoftwareInterruptCodes swi) {
   if (swi == call_rt_redirected) {
     Print("call_rt_redirected");
   } else if (swi == break_point) {
     Print("break_point");
   } else {
     out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                          "%d",
                                          swi);
   }
 }


 // Handles every format option that starts with 'r': the single registers
 // 'rn, 'rd, 'rs, 'rm and 'rt as well as the register list 'rlist. Returns
 // the number of format characters consumed (2, or 5 for 'rlist).
 int Decoder::FormatRegister(Instr* instr, const char* format) {
   ASSERT(format[0] == 'r');
   switch (format[1]) {
     case 'n':  // 'rn: Rn register
       PrintRegister(instr->RnField());
       return 2;
     case 'd':  // 'rd: Rd register
       PrintRegister(instr->RdField());
       return 2;
     case 's':  // 'rs: Rs register
       PrintRegister(instr->RsField());
       return 2;
     case 'm':  // 'rm: Rm register
       PrintRegister(instr->RmField());
       return 2;
     case 't':  // 'rt: Rt register
       PrintRegister(instr->RtField());
       return 2;
     case 'l': {
       // 'rlist: register list for load and store multiple instructions
       ASSERT(STRING_STARTS_WITH(format, "rlist"));
       Print("{");
       // Walk the bit mask from bit 0 upwards so that the registers come out
       // in ascending order; a separator is added while higher bits remain.
       int remaining = instr->RlistField();
       for (int reg = 0; remaining != 0; reg++, remaining >>= 1) {
         if ((remaining & 1) == 0) continue;
         PrintRegister(reg);
         if ((remaining >> 1) != 0) {
           Print(", ");
         }
       }
       Print("}");
       return 5;
     }
     default:
       break;
   }
   UNREACHABLE();
   return -1;
 }


 // Handles the VFP register options 'Sn, 'Sm, 'Sd, 'Dn, 'Dm and 'Dd. For an
 // S register the 4-bit register field is combined with the matching extra
 // bit (N, M or D) as the least significant bit; for a D register the field
 // is used as is. Returns the number of format characters consumed (2).
 int Decoder::FormatVFPRegister(Instr* instr, const char* format) {
   ASSERT((format[0] == 'S') || (format[0] == 'D'));
   const bool is_single = (format[0] == 'S');
   const bool is_double = (format[0] == 'D');

   switch (format[1]) {
     case 'n': {
       const int vn = instr->VnField();
       if (is_single) PrintSRegister(((vn << 1) | instr->NField()));
       if (is_double) PrintDRegister(vn);
       return 2;
     }
     case 'm': {
       const int vm = instr->VmField();
       if (is_single) PrintSRegister(((vm << 1) | instr->MField()));
       if (is_double) PrintDRegister(vm);
       return 2;
     }
     case 'd': {
       const int vd = instr->VdField();
       if (is_single) PrintSRegister(((vd << 1) | instr->DField()));
       if (is_double) PrintDRegister(vd);
       return 2;
     }
     default:
       break;
   }

   UNREACHABLE();
   return -1;
 }


 // Handles format options starting with 'v'. Prints the text at 'format'
 // verbatim and reports that zero format characters were consumed. 'instr'
 // is not inspected.
 int Decoder::FormatVFPinstruction(Instr* instr, const char* format) {
   Print(format);
   return 0;
 }


 // FormatOption takes a formatting string and interprets it based on
 // the current instructions. The format string points to the first
 // character of the option string (the option escape has already been
 // consumed by the caller.)  FormatOption returns the number of
 // characters that were consumed from the formatting string.
 //
 // The option is selected by its first character and, where several options
 // share that character, by a later character of the option name. An
 // unrecognized first character reaches UNREACHABLE() and yields -1.
 int Decoder::FormatOption(Instr* instr, const char* format) {
   switch (format[0]) {
     case 'a': {  // 'a: accumulate multiplies
       // Bit 21 clear prints "ul", set prints "la".
       if (instr->Bit(21) == 0) {
         Print("ul");
       } else {
         Print("la");
       }
       return 1;
     }
     case 'b': {  // 'b: byte loads or stores
       if (instr->HasB()) {
         Print("b");
       }
       return 1;
     }
     case 'c': {  // 'cond: conditional execution
       ASSERT(STRING_STARTS_WITH(format, "cond"));
       PrintCondition(instr);
       return 4;
     }
     case 'h': {  // 'h: halfword operation for extra loads and stores
       if (instr->HasH()) {
         Print("h");
       } else {
         Print("b");
       }
       return 1;
     }
     case 'l': {  // 'l: branch and link
       if (instr->HasLink()) {
         Print("l");
       }
       return 1;
     }
     case 'm': {
       if (format[1] == 'e') {  // 'memop: load/store instructions
         ASSERT(STRING_STARTS_WITH(format, "memop"));
         if (instr->HasL()) {
           Print("ldr");
         } else {
           Print("str");
         }
         return 5;
       }
       // 'msg: for simulator break instructions
       // The low 28 bits of the instruction are treated as an address and
       // handed to the name converter's NameInCode().
       ASSERT(STRING_STARTS_WITH(format, "msg"));
       byte* str =
           reinterpret_cast<byte*>(instr->InstructionBits() & 0x0fffffff);
       out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                            "%s", converter_.NameInCode(str));
       return 3;
     }
     case 'o': {
       // All offset options start with "off"; the characters that follow
       // pick the variant.
       if ((format[3] == '1') && (format[4] == '2')) {
         // 'off12: 12-bit offset for load and store instructions
         ASSERT(STRING_STARTS_WITH(format, "off12"));
         out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                              "%d", instr->Offset12Field());
         return 5;
       } else if ((format[3] == '1') && (format[4] == '6')) {
         // 'off16to20: value of bits 20..16 plus one
         ASSERT(STRING_STARTS_WITH(format, "off16to20"));
         out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                            "%d", instr->Bits(20, 16) +1);
         return 9;
       } else if (format[3] == '7') {
         // 'off7to11: value of the shift amount field
         ASSERT(STRING_STARTS_WITH(format, "off7to11"));
         out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                             "%d", instr->ShiftAmountField());
         return 8;
       }
       // 'off8: 8-bit offset for extra load and store instructions
       // The offset is assembled from the high and low immediate nibbles.
       ASSERT(STRING_STARTS_WITH(format, "off8"));
       int offs8 = (instr->ImmedHField() << 4) | instr->ImmedLField();
       out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                            "%d", offs8);
       return 4;
     }
     case 'p': {  // 'pu: P and U bits for load and store instructions
       ASSERT(STRING_STARTS_WITH(format, "pu"));
       PrintPU(instr);
       return 2;
     }
     case 'r': {
       // All register options ('rn, 'rd, ..., 'rlist).
       return FormatRegister(instr, format);
     }
     case 's': {
       if (format[1] == 'h') {  // 'shift_op or 'shift_rm
         if (format[6] == 'o') {  // 'shift_op
           // Type 0 uses a shifted register operand, type 1 an immediate.
           ASSERT(STRING_STARTS_WITH(format, "shift_op"));
           if (instr->TypeField() == 0) {
             PrintShiftRm(instr);
           } else {
             ASSERT(instr->TypeField() == 1);
             PrintShiftImm(instr);
           }
           return 8;
         } else {  // 'shift_rm
           ASSERT(STRING_STARTS_WITH(format, "shift_rm"));
           PrintShiftRm(instr);
           return 8;
         }
       } else if (format[1] == 'w') {  // 'swi
         ASSERT(STRING_STARTS_WITH(format, "swi"));
         PrintSoftwareInterrupt(instr->SwiField());
         return 3;
       } else if (format[1] == 'i') {  // 'sign: signed extra loads and stores
         ASSERT(STRING_STARTS_WITH(format, "sign"));
         if (instr->HasSign()) {
           Print("s");
         }
         return 4;
       }
       // 's: S field of data processing instructions
       if (instr->HasS()) {
         Print("s");
       }
       return 1;
     }
     case 't': {  // 'target: target of branch instructions
       // The printed offset is the signed 24-bit immediate times four plus 8;
       // the destination is that offset applied to the instruction's own
       // address and is named through the converter.
       ASSERT(STRING_STARTS_WITH(format, "target"));
       int off = (instr->SImmed24Field() << 2) + 8;
       out_buffer_pos_ += v8i::OS::SNPrintF(
           out_buffer_ + out_buffer_pos_,
           "%+d -> %s",
           off,
           converter_.NameOfAddress(reinterpret_cast<byte*>(instr) + off));
       return 6;
     }
     case 'u': {  // 'u: signed or unsigned multiplies
       // The manual gets the meaning of bit 22 backwards in the multiply
       // instruction overview on page A3.16.2.  The instructions that
       // exist in u and s variants are the following:
       // smull A4.1.87
       // umull A4.1.129
       // umlal A4.1.128
       // smlal A4.1.76
       // For these 0 means u and 1 means s.  As can be seen on their individual
       // pages.  The other 18 mul instructions have the bit set or unset in
       // arbitrary ways that are unrelated to the signedness of the instruction.
       // None of these 18 instructions exist in both a 'u' and an 's' variant.

       if (instr->Bit(22) == 0) {
         Print("u");
       } else {
         Print("s");
       }
       return 1;
     }
     case 'v': {
       // Options starting with 'v' are delegated to FormatVFPinstruction.
       return FormatVFPinstruction(instr, format);
     }
     case 'S':
     case 'D': {
       // VFP single ('S) and double ('D) precision register options.
       return FormatVFPRegister(instr, format);
     }
     case 'w': {  // 'w: W field of load and store instructions
       if (instr->HasW()) {
         Print("!");
       }
       return 1;
     }
     default: {
       UNREACHABLE();
       break;
     }
   }
   UNREACHABLE();
   return -1;
 }


 // Expands a complete instruction format string into the output buffer.
 // Ordinary characters are copied through; a single quote introduces an
 // option, which FormatOption interprets and whose length it reports so the
 // scan can continue after it. Output stops once only the terminator slot is
 // left, and the buffer is always 0-terminated.
 void Decoder::Format(Instr* instr, const char* format) {
   const char* cursor = format;
   for (char cur = *cursor++;
        (cur != 0) && (out_buffer_pos_ < (out_buffer_.length() - 1));
        cur = *cursor++) {
     if (cur != '\'') {
       PrintChar(cur);
       continue;
     }
     // Single quote is the formatting escape.
     cursor += FormatOption(instr, cursor);
   }
   out_buffer_[out_buffer_pos_]  = '\0';
 }


 // Called for encodings the disassembler does not decode. Appends the text
 // "unknown" to the output buffer; the instruction itself is not inspected.
 void Decoder::Unknown(Instr* instr) {
   // The text contains no format escapes, so it can be printed directly.
   Print("unknown");
 }


 // Decodes instruction types 0 and 1: multiplies, extra loads/stores and the
 // data processing instructions (plus bx, blx and clz, which share opcode
 // values with the flag-less forms of teq and cmn).
 void Decoder::DecodeType01(Instr* instr) {
   const int type = instr->TypeField();

   if ((type == 0) && instr->IsSpecialType0()) {
     if (instr->Bits(7, 4) != 9) {
       // Extra load/store instructions. Bit 22 clear selects a register
       // offset, bit 22 set an 8-bit immediate offset.
       const bool register_offset = (instr->Bit(22) == 0);
       switch (instr->PUField()) {
         case 0:
           Format(instr, register_offset
                      ? "'memop'cond'sign'h 'rd, ['rn], -'rm"
                      : "'memop'cond'sign'h 'rd, ['rn], #-'off8");
           break;
         case 1:
           Format(instr, register_offset
                      ? "'memop'cond'sign'h 'rd, ['rn], +'rm"
                      : "'memop'cond'sign'h 'rd, ['rn], #+'off8");
           break;
         case 2:
           Format(instr, register_offset
                      ? "'memop'cond'sign'h 'rd, ['rn, -'rm]'w"
                      : "'memop'cond'sign'h 'rd, ['rn, #-'off8]'w");
           break;
         case 3:
           Format(instr, register_offset
                      ? "'memop'cond'sign'h 'rd, ['rn, +'rm]'w"
                      : "'memop'cond'sign'h 'rd, ['rn, #+'off8]'w");
           break;
         default:
           // The PU field is a 2-bit field.
           UNREACHABLE();
           break;
       }
       return;
     }

     // Multiply instructions.
     if (instr->Bit(24) != 0) {
       Unknown(instr);  // not used by V8
       return;
     }
     if (instr->Bit(23) != 0) {
       // The signed/long multiply instructions name their targets RdHi and
       // RdLo. RdLo lives in the Rd field and RdHi in the Rn field; the
       // printed order is <RdLo>, <RdHi>, <Rm>, <Rs>.
       Format(instr, "'um'al'cond's 'rd, 'rn, 'rm, 'rs");
       return;
     }
     if (instr->Bit(21) == 0) {
       // MUL (A 4.1.33) calls its destination Rd but encodes it in the Rn
       // field.
       Format(instr, "mul'cond's 'rn, 'rm, 'rs");
     } else {
       // MLA (A 4.1.28) lists its registers as "Rd, Rm, Rs, Rn" but encodes
       // Rd in the Rn field and Rn in the Rd field.
       Format(instr, "mla'cond's 'rn, 'rm, 'rs, 'rd");
     }
     return;
   }

   // Data processing instructions.
   switch (instr->OpcodeField()) {
     case AND:
       Format(instr, "and'cond's 'rd, 'rn, 'shift_op");
       break;
     case EOR:
       Format(instr, "eor'cond's 'rd, 'rn, 'shift_op");
       break;
     case SUB:
       Format(instr, "sub'cond's 'rd, 'rn, 'shift_op");
       break;
     case RSB:
       Format(instr, "rsb'cond's 'rd, 'rn, 'shift_op");
       break;
     case ADD:
       Format(instr, "add'cond's 'rd, 'rn, 'shift_op");
       break;
     case ADC:
       Format(instr, "adc'cond's 'rd, 'rn, 'shift_op");
       break;
     case SBC:
       Format(instr, "sbc'cond's 'rd, 'rn, 'shift_op");
       break;
     case RSC:
       Format(instr, "rsc'cond's 'rd, 'rn, 'shift_op");
       break;
     case TST:
       if (instr->HasS()) {
         Format(instr, "tst'cond 'rn, 'shift_op");
       } else {
         Unknown(instr);  // not used by V8
       }
       break;
     case TEQ:
       if (instr->HasS()) {
         Format(instr, "teq'cond 'rn, 'shift_op");
       } else {
         // Without the S bit this opcode hosts the branch-exchange forms.
         const int sub_op = instr->Bits(7, 4);
         if (sub_op == BX) {
           Format(instr, "bx'cond 'rm");
         } else if (sub_op == BLX) {
           Format(instr, "blx'cond 'rm");
         } else {
           Unknown(instr);  // not used by V8
         }
       }
       break;
     case CMP:
       if (instr->HasS()) {
         Format(instr, "cmp'cond 'rn, 'shift_op");
       } else {
         Unknown(instr);  // not used by V8
       }
       break;
     case CMN:
       if (instr->HasS()) {
         Format(instr, "cmn'cond 'rn, 'shift_op");
       } else if (instr->Bits(7, 4) == CLZ) {
         // Without the S bit this opcode hosts clz.
         Format(instr, "clz'cond 'rd, 'rm");
       } else {
         Unknown(instr);  // not used by V8
       }
       break;
     case ORR:
       Format(instr, "orr'cond's 'rd, 'rn, 'shift_op");
       break;
     case MOV:
       Format(instr, "mov'cond's 'rd, 'shift_op");
       break;
     case BIC:
       Format(instr, "bic'cond's 'rd, 'rn, 'shift_op");
       break;
     case MVN:
       Format(instr, "mvn'cond's 'rd, 'shift_op");
       break;
     default:
       // The Opcode field is a 4-bit field.
       UNREACHABLE();
       break;
   }
 }


 // Decodes type 2 instructions: loads and stores with a 12-bit immediate
 // offset. The PU field selects post-indexed (0, 1) or pre-indexed/offset
 // (2, 3) addressing and the sign of the offset.
 void Decoder::DecodeType2(Instr* instr) {
   switch (instr->PUField()) {
     case 0: {
       if (instr->HasW()) {
         // Stop here so that the regular load/store text is not appended
         // after "unknown".
         Unknown(instr);  // not used in V8
         return;
       }
       Format(instr, "'memop'cond'b 'rd, ['rn], #-'off12");
       break;
     }
     case 1: {
       if (instr->HasW()) {
         // Stop here so that the regular load/store text is not appended
         // after "unknown".
         Unknown(instr);  // not used in V8
         return;
       }
       Format(instr, "'memop'cond'b 'rd, ['rn], #+'off12");
       break;
     }
     case 2: {
       Format(instr, "'memop'cond'b 'rd, ['rn, #-'off12]'w");
       break;
     }
     case 3: {
       Format(instr, "'memop'cond'b 'rd, ['rn, #+'off12]'w");
       break;
     }
     default: {
       // The PU field is a 2-bit field.
       UNREACHABLE();
       break;
     }
   }
 }


 // Decodes type 3 instructions: loads and stores with a (shifted) register
 // offset, plus ubfx, which is recognized within the PU == 3 encodings.
 void Decoder::DecodeType3(Instr* instr) {
   const int pu = instr->PUField();
   if (pu == 0) {
     ASSERT(!instr->HasW());
     Format(instr, "'memop'cond'b 'rd, ['rn], -'shift_rm");
   } else if (pu == 1) {
     ASSERT(!instr->HasW());
     Format(instr, "'memop'cond'b 'rd, ['rn], +'shift_rm");
   } else if (pu == 2) {
     Format(instr, "'memop'cond'b 'rd, ['rn, -'shift_rm]'w");
   } else if (pu == 3) {
     const bool is_ubfx = instr->HasW() && (instr->Bits(6, 4) == 0x5);
     if (!is_ubfx) {
       Format(instr, "'memop'cond'b 'rd, ['rn, +'shift_rm]'w");
       return;
     }
     // Bits 20..16 hold the field width minus one and the shift amount
     // field holds the least significant bit; together they must stay
     // within a 32-bit register.
     const uint32_t widthminus1 = static_cast<uint32_t>(instr->Bits(20, 16));
     const uint32_t lsbit = static_cast<uint32_t>(instr->ShiftAmountField());
     const uint32_t msbit = widthminus1 + lsbit;
     if (msbit > 31) {
       UNREACHABLE();
     } else {
       Format(instr, "ubfx'cond 'rd, 'rm, #'off7to11, #'off16to20");
     }
   } else {
     // The PU field is a 2-bit field.
     UNREACHABLE();
   }
 }


 // Decodes type 4 instructions: load multiple (L bit set) and store
 // multiple.
 void Decoder::DecodeType4(Instr* instr) {
   ASSERT(instr->Bit(22) == 0);  // Privileged mode currently not supported.
   const char* multiple_format = instr->HasL()
       ? "ldm'cond'pu 'rn'w, 'rlist"
       : "stm'cond'pu 'rn'w, 'rlist";
   Format(instr, multiple_format);
 }


 // Decodes type 5 instructions: branch, with the optional link suffix, the
 // condition and the branch target.
 void Decoder::DecodeType5(Instr* instr) {
   const char* branch_format = "b'l'cond 'target";
   Format(instr, branch_format);
 }


 // Decodes type 6 instructions. All of them are handed to the coprocessor
 // instruction decoder.
 void Decoder::DecodeType6(Instr* instr) {
   DecodeType6CoprocessorIns(instr);
 }


 // Decodes type 7 instructions: a software interrupt when bit 24 is set,
 // otherwise a VFP instruction.
 void Decoder::DecodeType7(Instr* instr) {
   if (instr->Bit(24) != 1) {
     DecodeTypeVFP(instr);
     return;
   }
   Format(instr, "swi'cond 'swi");
 }

 // Decodes instructions whose condition field holds the special
 // (unconditional) value. An extra-load encoding (bits 7..4 == 0xB, bits
 // 27..25 == 0, L bit set) is printed as a load with its addressing mode;
 // everything else is printed as a simulator "break" with its message.
 void Decoder::DecodeUnconditional(Instr* instr) {
   if (instr->Bits(7, 4) == 0xB && instr->Bits(27, 25) == 0 && instr->HasL()) {
     Format(instr, "'memop'h'pu 'rd, ");
     // The immediate of this encoding is the 8-bit value split over the high
     // and low immediate nibbles, so it is printed with the 'off8 option
     // (there is no 'imm12 option in FormatOption).
     bool immediate = instr->HasB();
     switch (instr->PUField()) {
       case 0: {
         // Post index, negative.
         if (instr->HasW()) {
           Unknown(instr);
           break;
         }
         if (immediate) {
           Format(instr, "['rn], #-'off8");
         } else {
           Format(instr, "['rn], -'rm");
         }
         break;
       }
       case 1: {
         // Post index, positive.
         if (instr->HasW()) {
           Unknown(instr);
           break;
         }
         if (immediate) {
           Format(instr, "['rn], #+'off8");
         } else {
           Format(instr, "['rn], +'rm");
         }
         break;
       }
       case 2: {
         // Pre index or offset, negative.
         if (immediate) {
           Format(instr, "['rn, #-'off8]'w");
         } else {
           Format(instr, "['rn, -'rm]'w");
         }
         break;
       }
       case 3: {
         // Pre index or offset, positive.
         if (immediate) {
           Format(instr, "['rn, #+'off8]'w");
         } else {
           Format(instr, "['rn, +'rm]'w");
         }
         break;
       }
       default: {
         // The PU field is a 2-bit field.
         UNREACHABLE();
         break;
       }
     }
     return;
   }
   Format(instr, "break 'msg");
 }


 // void Decoder::DecodeTypeVFP(Instr* instr)
 // Decodes the type 7 instructions that have bit 24 clear. The encodings
 // recognized here are:
 // vmov: Sn = Rt
 // vmov: Rt = Sn
 // vcvt: Dd = Sm
 // vcvt: Sd = Dm
 // Dd = vadd(Dn, Dm)
 // Dd = vsub(Dn, Dm)
 // Dd = vmul(Dn, Dm)
 // Dd = vdiv(Dn, Dm)
 // vcmp(Dd, Dm)
 // VMRS
 // Anything else is printed through Unknown(). The bit patterns are tested
 // in sequence, so the first matching pattern wins.
 void Decoder::DecodeTypeVFP(Instr* instr) {
   ASSERT((instr->TypeField() == 7) && (instr->Bit(24) == 0x0) );

   if (instr->Bit(23) == 1) {
     // Bit 23 set: conversions, divide, compare and vmrs.
     if ((instr->Bits(21, 19) == 0x7) &&
         (instr->Bits(18, 16) == 0x5) &&
         (instr->Bits(11, 9) == 0x5) &&
         (instr->Bit(8) == 1) &&
         (instr->Bit(6) == 1) &&
         (instr->Bit(4) == 0)) {
       Format(instr, "vcvt.s32.f64'cond 'Sd, 'Dm");
     } else if ((instr->Bits(21, 19) == 0x7) &&
                (instr->Bits(18, 16) == 0x0) &&
                (instr->Bits(11, 9) == 0x5) &&
                (instr->Bit(8) == 1) &&
                (instr->Bit(7) == 1) &&
                (instr->Bit(6) == 1) &&
                (instr->Bit(4) == 0)) {
       Format(instr, "vcvt.f64.s32'cond 'Dd, 'Sm");
     } else if ((instr->Bit(21) == 0x0) &&
                (instr->Bit(20) == 0x0) &&
                (instr->Bits(11, 9) == 0x5) &&
                (instr->Bit(8) == 1) &&
                (instr->Bit(6) == 0) &&
                (instr->Bit(4) == 0)) {
         Format(instr, "vdiv.f64'cond 'Dd, 'Dn, 'Dm");
     } else if ((instr->Bits(21, 20) == 0x3) &&
                (instr->Bits(19, 16) == 0x4) &&
                (instr->Bits(11, 9) == 0x5) &&
                (instr->Bit(8) == 0x1) &&
                (instr->Bit(6) == 0x1) &&
                (instr->Bit(4) == 0x0)) {
       Format(instr, "vcmp.f64'cond 'Dd, 'Dm");
     } else if ((instr->Bits(23, 20) == 0xF) &&
                (instr->Bits(19, 16) == 0x1) &&
                (instr->Bits(11, 8) == 0xA) &&
                (instr->Bits(7, 5) == 0x0) &&
                (instr->Bit(4) == 0x1)    &&
                (instr->Bits(3, 0) == 0x0)) {
         // Only the form with bits 15..12 all set is printed as vmrs.
         if (instr->Bits(15, 12) == 0xF)
           Format(instr, "vmrs'cond APSR, FPSCR");
         else
           Unknown(instr);  // Not used by V8.
     } else {
       Unknown(instr);  // Not used by V8.
     }
   } else if (instr->Bit(21) == 1) {
     // Bit 23 clear, bit 21 set: add, subtract and multiply. Bit 20 and
     // bit 6 tell the three apart.
     if ((instr->Bit(20) == 0x1) &&
         (instr->Bits(11, 9) == 0x5) &&
         (instr->Bit(8) == 0x1) &&
         (instr->Bit(6) == 0) &&
         (instr->Bit(4) == 0)) {
       Format(instr, "vadd.f64'cond 'Dd, 'Dn, 'Dm");
     } else if ((instr->Bit(20) == 0x1) &&
                (instr->Bits(11, 9) == 0x5) &&
                (instr->Bit(8) == 0x1) &&
                (instr->Bit(6) == 1) &&
                (instr->Bit(4) == 0)) {
       Format(instr, "vsub.f64'cond 'Dd, 'Dn, 'Dm");
     } else if ((instr->Bit(20) == 0x0) &&
                (instr->Bits(11, 9) == 0x5) &&
                (instr->Bit(8) == 0x1) &&
                (instr->Bit(6) == 0) &&
                (instr->Bit(4) == 0)) {
       Format(instr, "vmul.f64'cond 'Dd, 'Dn, 'Dm");
     } else {
       Unknown(instr);  // Not used by V8.
     }
   } else {
     // Bits 23 and 21 clear: moves between a core register and an S
     // register. Bit 20 selects the direction.
     if ((instr->Bit(20) == 0x0) &&
         (instr->Bits(11, 8) == 0xA) &&
         (instr->Bits(6, 5) == 0x0) &&
         (instr->Bit(4) == 1) &&
         (instr->Bits(3, 0) == 0x0)) {
       Format(instr, "vmov'cond 'Sn, 'rt");
     } else if ((instr->Bit(20) == 0x1) &&
                (instr->Bits(11, 8) == 0xA) &&
                (instr->Bits(6, 5) == 0x0) &&
                (instr->Bit(4) == 1) &&
                (instr->Bits(3, 0) == 0x0)) {
       Format(instr, "vmov'cond 'rt, 'Sn");
     } else {
       Unknown(instr);  // Not used by V8.
     }
   }
 }


 // Decodes the type 6 coprocessor instructions used by V8. Only coprocessor
 // 0xB is handled; the recognized forms are:
 //   Dm = vmov(Rt, Rt2)
 //   <Rt, Rt2> = vmov(Dm)
 //   Ddst = MEM(Rbase + 4*offset)
 //   MEM(Rbase + 4*offset) = Dsrc
 // Everything else is printed through Unknown().
 void Decoder::DecodeType6CoprocessorIns(Instr* instr) {
   ASSERT((instr->TypeField() == 6));

   if (instr->CoprocessorField() != 0xB) {
     Unknown(instr);  // Not used by V8.
     return;
   }

   const bool is_load = instr->HasL();
   switch (instr->OpcodeField()) {
     case 0x2:
       // Move a double to or from a pair of core registers.
       if (instr->Bits(7, 4) != 0x1) {
         Unknown(instr);  // Not used by V8.
       } else {
         Format(instr, is_load ? "vmov'cond 'rt, 'rn, 'Dm"
                               : "vmov'cond 'Dm, 'rt, 'rn");
       }
       break;
     case 0x8:
       // Load/store with the offset subtracted from the base.
       Format(instr, is_load ? "vldr'cond 'Dd, ['rn - 4*'off8]"
                             : "vstr'cond 'Dd, ['rn - 4*'off8]");
       break;
     case 0xC:
       // Load/store with the offset added to the base.
       Format(instr, is_load ? "vldr'cond 'Dd, ['rn + 4*'off8]"
                             : "vstr'cond 'Dd, ['rn + 4*'off8]");
       break;
     default:
       Unknown(instr);  // Not used by V8.
       break;
   }
 }


 // Disassemble the instruction at *instr_ptr into the output buffer.
 // The raw instruction word is written first as eight hex digits followed by
 // padding, then the decoder matching the instruction's condition/type field
 // appends the mnemonic. Always returns Instr::kInstrSize.
 int Decoder::InstructionDecode(byte* instr_ptr) {
   Instr* instr = Instr::At(instr_ptr);

   // Print raw instruction bytes.
   out_buffer_pos_ += v8i::OS::SNPrintF(out_buffer_ + out_buffer_pos_,
                                        "%08x       ",
                                        instr->InstructionBits());

   if (instr->ConditionField() == special_condition) {
     // Instructions carrying the special condition bypass the type dispatch.
     DecodeUnconditional(instr);
   } else {
     switch (instr->TypeField()) {
       case 0:
       case 1:
         DecodeType01(instr);
         break;
       case 2:
         DecodeType2(instr);
         break;
       case 3:
         DecodeType3(instr);
         break;
       case 4:
         DecodeType4(instr);
         break;
       case 5:
         DecodeType5(instr);
         break;
       case 6:
         DecodeType6(instr);
         break;
       case 7:
         DecodeType7(instr);
         break;
       default:
         // The type field is 3-bits in the ARM encoding.
         UNREACHABLE();
         break;
     }
   }

   return Instr::kInstrSize;
 }


 } }  // namespace assembler::arm


 //------------------------------------------------------------------------------

 namespace disasm {

 namespace v8i = v8::internal;


 // Formats addr with "%p" into a function-local static 32-character buffer and
 // returns a pointer to the start of that buffer. Because the buffer is static,
 // each call overwrites the text produced by the previous one.
 const char* NameConverter::NameOfAddress(byte* addr) const {
   static v8::internal::EmbeddedVector<char, 32> formatted_address;
   v8::internal::OS::SNPrintF(formatted_address, "%p", addr);
   return formatted_address.start();
 }


 // Constants are named exactly like addresses: the call is forwarded to
 // NameOfAddress() and its result returned unchanged.
 const char* NameConverter::NameOfConstant(byte* addr) const {
   const char* const constant_name = NameOfAddress(addr);
   return constant_name;
 }


 // Returns the name that assembler::arm::Registers::Name() reports for the
 // register number reg.
 const char* NameConverter::NameOfCPURegister(int reg) const {
   const char* const register_name = assembler::arm::Registers::Name(reg);
   return register_name;
 }


 // ARM does not have the concept of a byte register, so reaching this function
 // is flagged with UNREACHABLE(). The placeholder string is what is returned
 // should execution continue past that macro.
 const char* NameConverter::NameOfByteCPURegister(int reg) const {
   const char* const placeholder = "nobytereg";
   UNREACHABLE();
   return placeholder;
 }


 // ARM does not have any XMM registers, so reaching this function is flagged
 // with UNREACHABLE(). The placeholder string is what is returned should
 // execution continue past that macro.
 const char* NameConverter::NameOfXMMRegister(int reg) const {
   const char* const placeholder = "noxmmreg";
   UNREACHABLE();
   return placeholder;
 }


 // Returns an empty name for every address. The default name converter is
 // called for unknown code, so addr is deliberately never dereferenced.
 const char* NameConverter::NameInCode(byte* addr) const {
   const char* const no_name = "";
   return no_name;
 }


 //------------------------------------------------------------------------------

 // Constructs a disassembler that uses the given name converter; the argument
 // is stored in converter_ and later handed to each Decoder that is created.
 Disassembler::Disassembler(const NameConverter& converter)
     : converter_(converter) {}


 // The destructor body is empty; no explicit cleanup is performed here.
 Disassembler::~Disassembler() {}


 // Decodes the single instruction at `instruction`, writing its text into
 // `buffer` through a temporary ARM Decoder bound to this disassembler's name
 // converter. Returns whatever the decoder reports as the instruction size.
 int Disassembler::InstructionDecode(v8::internal::Vector<char> buffer,
                                     byte* instruction) {
   assembler::arm::Decoder decoder(converter_, buffer);
   const int instruction_size = decoder.InstructionDecode(instruction);
   return instruction_size;
 }


 // Inspects the instruction word at `instruction`. When its top 12 bits equal
 // 0x030 the low 16 bits of the word are returned; otherwise the result is -1.
 int Disassembler::ConstantPoolSizeAt(byte* instruction) {
   const int word = *(reinterpret_cast<int*>(instruction));
   const bool matches_marker = (word & 0xfff00000) == 0x03000000;
   return matches_marker ? (word & 0x0000ffff) : -1;
 }


 void Disassembler::Disassemble(FILE* f, byte* begin, byte* end) {
   NameConverter converter;
   Disassembler d(converter);
   for (byte* pc = begin; pc < end;) {
     v8::internal::EmbeddedVector<char, 128> buffer;
     buffer[0] = '\0';
     byte* prev_pc = pc;
     pc += d.InstructionDecode(buffer, pc);
     fprintf(f, "%p    %08x      %s\n",
             prev_pc, *reinterpret_cast<int32_t*>(prev_pc), buffer.start());
   }
 }


 }  // namespace disasm