1 files changed, 141 insertions, 103 deletions
diff --git a/courgette/disassembler_elf_32_arm.cc b/courgette/disassembler_elf_32_arm.cc
index f6490d9..39172f4 100644
--- a/courgette/disassembler_elf_32_arm.cc
+++ b/courgette/disassembler_elf_32_arm.cc
@@ -4,18 +4,12 @@
 
 #include "courgette/disassembler_elf_32_arm.h"
 
-#include <stddef.h>
-#include <stdint.h>
-
-#include <algorithm>
-#include <string>
 #include <vector>
 
 #include "base/logging.h"
-
+#include "base/memory/scoped_ptr.h"
 #include "courgette/assembly_program.h"
 #include "courgette/courgette.h"
-#include "courgette/encoded_program.h"
 
 namespace courgette {
 
@@ -24,31 +18,34 @@ CheckBool DisassemblerElf32ARM::Compress(ARM_RVA type,
                                          RVA rva,
                                          uint16_t* c_op,
                                          uint32_t* addr) {
-  // This method takes an ARM or thumb opcode, extracts the relative
-  // target address from it (addr), and creates a corresponding
-  // Courgette opcode (c_op).
-  //
-  // Details on ARM the opcodes, and how the relative targets are
-  // computed were taken from the "ARM Architecture Reference Manual",
-  // section A4.1.5 and the "Thumb-2 supplement", section 4.6.12.
-  // ARM_OFF24 is for the ARM opcode.  The rest are for thumb opcodes.
+  // Notation for bit ranges in comments:
+  // - Listing bits from highest to lowest.
+  // - A-Z or (j1), (j2), etc.: single bit in source.
+  // - a-z: multiple, consecutive bits in source.
   switch (type) {
     case ARM_OFF8: {
-      // The offset is given by lower 8 bits of the op.  It is a 9-bit
-      // offset, shifted right one bit and signed extended.
+      // Encoding T1.
+      // The offset is given by lower 8 bits of the op.  It is a 9-bit offset,
+      // shifted right 1 bit, and signed extended.
+      // arm_op = aaaaaaaa Snnnnnnn
+      // *addr := SSSSSSSS SSSSSSSS SSSSSSSS nnnnnnn0 + 100
+      // *c_op := 00010000 aaaaaaaa
       uint32_t temp = (arm_op & 0x00FF) << 1;
       if (temp & 0x0100)
         temp |= 0xFFFFFE00;
       temp += 4;  // Offset from _next_ PC.
-      fflush(stdout);
 
       (*addr) = temp;
       (*c_op) = static_cast<uint16_t>(arm_op >> 8) | 0x1000;
       break;
     }
     case ARM_OFF11: {
-      // The offset is given by lower 11 bits of the op, and is a
-      // 12-bit offset, shifted right one bit and sign extended.
+      // Encoding T2.
+      // The offset is given by lower 11 bits of the op, and is a 12-bit offset,
+      // shifted right 1 bit, and sign extended.
+      // arm_op = aaaaaSnn nnnnnnnn
+      // *addr := SSSSSSSS SSSSSSSS SSSSSnnn nnnnnnn0 + 100
+      // *c_op := 00100000 000aaaaa
       uint32_t temp = (arm_op & 0x07FF) << 1;
       if (temp & 0x00000800)
         temp |= 0xFFFFF000;
@@ -61,6 +58,9 @@ CheckBool DisassemblerElf32ARM::Compress(ARM_RVA type,
     case ARM_OFF24: {
       // The offset is given by the lower 24-bits of the op, shifted
       // left 2 bits, and sign extended.
+      // arm_op = aaaaaaaa Snnnnnnn nnnnnnnn nnnnnnnn
+      // *addr := SSSSSSSn nnnnnnnn nnnnnnnn nnnnnn00 + 1000
+      // *c_op := 00110000 aaaaaaaa
       uint32_t temp = (arm_op & 0x00FFFFFF) << 2;
       if (temp & 0x02000000)
         temp |= 0xFC000000;
@@ -71,6 +71,18 @@ CheckBool DisassemblerElf32ARM::Compress(ARM_RVA type,
       break;
     }
     case ARM_OFF25: {
+      // Encoding T4.
+      // arm_op = aaaaaSmm mmmmmmmm BC(j1)D(j2)nnn nnnnnnnn
+      //   where CD is in {01, 10, 11}
+      // i1 := ~(j1 ^ S)
+      // i2 := ~(j2 ^ S)
+      // If CD == 10:
+      //   pppp := (rva % 4 == 0) ? 0100 : 0010
+      // Else:
+      //   pppp := 0100
+      // *addr := SSSSSSSS (i1)(i2)mmmmmm mmmmnnnn nnnnnnn0 + pppp
+      // *c_op := 0100pppp aaaaaBCD
+      // TODO(huangs): aaaaa = 11110 and B = 1 always? Investigate and fix.
       uint32_t temp = 0;
       temp |= (arm_op & 0x000007FF) << 1;  // imm11
       temp |= (arm_op & 0x03FF0000) >> 4;  // imm10
@@ -78,8 +90,8 @@ CheckBool DisassemblerElf32ARM::Compress(ARM_RVA type,
       uint32_t S = (arm_op & (1 << 26)) >> 26;
       uint32_t j2 = (arm_op & (1 << 11)) >> 11;
       uint32_t j1 = (arm_op & (1 << 13)) >> 13;
-      bool bit12 = ((arm_op & (1 << 12)) >> 12) != 0;
-      bool bit14 = ((arm_op & (1 << 14)) >> 14) != 0;
+      bool bit12 = ((arm_op & (1 << 12)) >> 12) != 0;  // D
+      bool bit14 = ((arm_op & (1 << 14)) >> 14) != 0;  // C
 
       uint32_t i2 = ~(j2 ^ S) & 1;
       uint32_t i1 = ~(j1 ^ S) & 1;
@@ -91,7 +103,7 @@ CheckBool DisassemblerElf32ARM::Compress(ARM_RVA type,
         temp |= 0xFE000000;
       uint32_t prefetch;
       if (toARM) {
-        // Align PC on 4-byte boundary
+        // Align PC on 4-byte boundary.
         uint32_t align4byte = (rva % 4) ? 2 : 4;
         prefetch = align4byte;
       } else {
@@ -101,20 +113,25 @@ CheckBool DisassemblerElf32ARM::Compress(ARM_RVA type,
       (*addr) = temp;
 
       uint32_t temp2 = 0x4000;
-      temp2 |= (arm_op & (1 << 12)) >> 12;
-      temp2 |= (arm_op & (1 << 14)) >> 13;
-      temp2 |= (arm_op & (1 << 15)) >> 13;
-      temp2 |= (arm_op & 0xF8000000) >> 24;
+      temp2 |= (arm_op & (1 << 12)) >> 12;   // .......D
+      temp2 |= (arm_op & (1 << 14)) >> 13;   // ......C.
+      temp2 |= (arm_op & (1 << 15)) >> 13;   // .....B..
+      temp2 |= (arm_op & 0xF8000000) >> 24;  // aaaaa...
       temp2 |= (prefetch & 0x0000000F) << 8;
       (*c_op) = static_cast<uint16_t>(temp2);
       break;
     }
     case ARM_OFF21: {
+      // Encoding T3.
+      // arm_op = 11110Scc ccmmmmmm 10(j1)0(j2)nnn nnnnnnnn
+      // *addr := SSSSSSSS SSSS(j1)(j2)mm mmmmnnnn nnnnnnn0 + 100
+      // *c_op := 01010000 0000cccc
       uint32_t temp = 0;
       temp |= (arm_op & 0x000007FF) << 1;  // imm11
       temp |= (arm_op & 0x003F0000) >> 4;  // imm6
 
       uint32_t S = (arm_op & (1 << 26)) >> 26;
+      // TODO(huangs): Check with docs: Perhaps j1, j2 should swap?
       uint32_t j2 = (arm_op & (1 << 11)) >> 11;
       uint32_t j1 = (arm_op & (1 << 13)) >> 13;
 
@@ -140,20 +157,31 @@ CheckBool DisassemblerElf32ARM::Decompress(ARM_RVA type,
                                            uint16_t c_op,
                                            uint32_t addr,
                                            uint32_t* arm_op) {
-  // Reverses the process in the compress() method.  Takes the
-  // Courgette op and relative address and reconstructs the original
-  // ARM or thumb op.
   switch (type) {
     case ARM_OFF8:
+      // addr     = SSSSSSSS SSSSSSSS SSSSSSSS nnnnnnn0 + 100
+      // c_op     = 00010000 aaaaaaaa
+      // *arm_op := aaaaaaaa Snnnnnnn
       (*arm_op) = ((c_op & 0x0FFF) << 8) | (((addr - 4) >> 1) & 0x000000FF);
       break;
     case ARM_OFF11:
+      // addr     = SSSSSSSS SSSSSSSS SSSSSnnn nnnnnnn0 + 100
+      // c_op     = 00100000 000aaaaa
+      // *arm_op := aaaaaSnn nnnnnnnn
       (*arm_op) = ((c_op & 0x0FFF) << 11) | (((addr - 4) >> 1) & 0x000007FF);
       break;
     case ARM_OFF24:
+      // addr     = SSSSSSSn nnnnnnnn nnnnnnnn nnnnnn00 + 1000
+      // c_op     = 00110000 aaaaaaaa
+      // *arm_op := aaaaaaaa Snnnnnnn nnnnnnnn nnnnnnnn
       (*arm_op) = ((c_op & 0x0FFF) << 24) | (((addr - 8) >> 2) & 0x00FFFFFF);
       break;
     case ARM_OFF25: {
+      // addr     = SSSSSSSS (i1)(i2)mmmmmm mmmmnnnn nnnnnnn0 + pppp
+      // c_op     = 0100pppp aaaaaBCD
+      // j1      := ~i1 ^ S
+      // j2      := ~i2 ^ S
+      // *arm_op := aaaaaSmm mmmmmmmm BC(j1)D(j2)nnn nnnnnnnn
       uint32_t temp = 0;
       temp |= (c_op & (1 << 0)) << 12;
       temp |= (c_op & (1 << 1)) << 13;
@@ -183,6 +211,9 @@ CheckBool DisassemblerElf32ARM::Decompress(ARM_RVA type,
       break;
     }
     case ARM_OFF21: {
+      // addr     = SSSSSSSS SSSS(j1)(j2)mm mmmmnnnn nnnnnnn0 + 100
+      // c_op     = 01010000 0000cccc
+      // *arm_op := 11110Scc ccmmmmmm 10(j1)0(j2)nnn nnnnnnnn
       uint32_t temp = 0xF0008000;
       temp |= (c_op & (0x03C00000 >> 22)) << 22;
 
@@ -230,24 +261,28 @@ CheckBool DisassemblerElf32ARM::TypedRVAARM::ComputeRelativeTarget(
     const uint8_t* op_pointer) {
   arm_op_ = op_pointer;
   switch (type_) {
-    case ARM_OFF8:
-      // Fall through
+    case ARM_OFF8:  // Falls through.
     case ARM_OFF11: {
       RVA relative_target;
-      CheckBool ret = Compress(type_, Read16LittleEndian(op_pointer), rva(),
-                               &c_op_, &relative_target);
+      CheckBool ret = Compress(type_,
+                               Read16LittleEndian(op_pointer),
+                               rva(),
+                               &c_op_,
+                               &relative_target);
       set_relative_target(relative_target);
       return ret;
     }
     case ARM_OFF24: {
       RVA relative_target;
-      CheckBool ret = Compress(type_, Read32LittleEndian(op_pointer), rva(),
-                               &c_op_, &relative_target);
+      CheckBool ret = Compress(type_,
+                               Read32LittleEndian(op_pointer),
+                               rva(),
+                               &c_op_,
+                               &relative_target);
       set_relative_target(relative_target);
       return ret;
     }
-    case ARM_OFF25:
-      // Fall through
+    case ARM_OFF25:  // Falls through.
     case ARM_OFF21: {
       // A thumb-2 op is 32 bits stored as two 16-bit words
       uint32_t pval = (Read16LittleEndian(op_pointer) << 16) |
@@ -272,26 +307,24 @@ CheckBool DisassemblerElf32ARM::TypedRVAARM::EmitInstruction(
 }
 
 DisassemblerElf32ARM::DisassemblerElf32ARM(const void* start, size_t length)
-  : DisassemblerElf32(start, length) {
+    : DisassemblerElf32(start, length) {
 }
 
-// Convert an ELF relocation struction into an RVA
+// Convert an ELF relocation struction into an RVA.
 CheckBool DisassemblerElf32ARM::RelToRVA(Elf32_Rel rel, RVA* result) const {
-
-  // The rightmost byte of r_info is the type...
+  // The rightmost byte of r_info is the type.
   elf32_rel_arm_type_values type =
-      (elf32_rel_arm_type_values)(unsigned char)rel.r_info;
+      static_cast<elf32_rel_arm_type_values>(rel.r_info & 0xFF);
 
-  // The other 3 bytes of r_info are the symbol
+  // The other 3 bytes of r_info are the symbol.
   uint32_t symbol = rel.r_info >> 8;
 
-  switch(type)
-  {
+  switch (type) {
     case R_ARM_RELATIVE:
       if (symbol != 0)
         return false;
 
-      // This is a basic ABS32 relocation address
+      // This is a basic ABS32 relocation address.
       *result = rel.r_offset;
       return true;
 
@@ -301,32 +334,33 @@ CheckBool DisassemblerElf32ARM::RelToRVA(Elf32_Rel rel, RVA* result) const {
 }
 
 CheckBool DisassemblerElf32ARM::ParseRelocationSection(
-    const Elf32_Shdr *section_header,
-      AssemblyProgram* program) {
-  // This method compresses a contiguous stretch of R_ARM_RELATIVE
-  // entries in the relocation table with a Courgette relocation table
-  // instruction.  It skips any entries at the beginning that appear
-  // in a section that Courgette doesn't support, e.g. INIT.
+    const Elf32_Shdr* section_header,
+    AssemblyProgram* program) {
+  // This method compresses a contiguous stretch of R_ARM_RELATIVE entries in
+  // the relocation table with a Courgette relocation table instruction.
+  // It skips any entries at the beginning that appear in a section that
+  // Courgette doesn't support, e.g. INIT.
+  //
   // Specifically, the entries should be
   //   (1) In the same relocation table
   //   (2) Are consecutive
   //   (3) Are sorted in memory address order
   //
-  // Happily, this is normally the case, but it's not required by spec
-  // so we check, and just don't do it if we don't match up.
+  // Happily, this is normally the case, but it's not required by spec so we
+  // check, and just don't do it if we don't match up.
   //
-  // The expectation is that one relocation section will contain
-  // all of our R_ARM_RELATIVE entries in the expected order followed
-  // by assorted other entries we can't use special handling for.
+  // The expectation is that one relocation section will contain all of our
+  // R_ARM_RELATIVE entries in the expected order followed by assorted other
+  // entries we can't use special handling for.
 
   bool match = true;
 
-  // Walk all the bytes in the section, matching relocation table or not
-  size_t file_offset = section_header->sh_offset;
-  size_t section_end = section_header->sh_offset + section_header->sh_size;
+  // Walk all the bytes in the section, matching relocation table or not.
+  FileOffset file_offset = section_header->sh_offset;
+  FileOffset section_end = section_header->sh_offset + section_header->sh_size;
 
-  Elf32_Rel *section_relocs_iter =
-      (Elf32_Rel *)OffsetToPointer(section_header->sh_offset);
+  const Elf32_Rel* section_relocs_iter = reinterpret_cast<const Elf32_Rel*>(
+      FileOffsetToPointer(section_header->sh_offset));
 
   uint32_t section_relocs_count =
       section_header->sh_size / section_header->sh_entsize;
@@ -337,13 +371,15 @@ CheckBool DisassemblerElf32ARM::ParseRelocationSection(
   if (!abs32_locations_.empty()) {
     std::vector<RVA>::iterator reloc_iter = abs32_locations_.begin();
 
-    for (uint32_t i = 0; i < section_relocs_count; i++) {
+    for (uint32_t i = 0; i < section_relocs_count; ++i) {
       if (section_relocs_iter->r_offset == *reloc_iter)
         break;
 
-      if (!ParseSimpleRegion(file_offset, file_offset + sizeof(Elf32_Rel),
-                             program))
+      if (!ParseSimpleRegion(file_offset,
+                             file_offset + sizeof(Elf32_Rel),
+                             program)) {
         return false;
+      }
 
       file_offset += sizeof(Elf32_Rel);
       ++section_relocs_iter;
@@ -351,11 +387,12 @@ CheckBool DisassemblerElf32ARM::ParseRelocationSection(
 
     while (match && (reloc_iter != abs32_locations_.end())) {
       if (section_relocs_iter->r_info != R_ARM_RELATIVE ||
-          section_relocs_iter->r_offset != *reloc_iter)
+          section_relocs_iter->r_offset != *reloc_iter) {
         match = false;
+      }
 
-      section_relocs_iter++;
-      reloc_iter++;
+      ++section_relocs_iter;
+      ++reloc_iter;
       file_offset += sizeof(Elf32_Rel);
     }
 
@@ -369,118 +406,119 @@ CheckBool DisassemblerElf32ARM::ParseRelocationSection(
   return ParseSimpleRegion(file_offset, section_end, program);
 }
 
+// TODO(huangs): Detect and avoid overlap with abs32 addresses.
 CheckBool DisassemblerElf32ARM::ParseRel32RelocsFromSection(
     const Elf32_Shdr* section_header) {
-  uint32_t start_file_offset = section_header->sh_offset;
-  uint32_t end_file_offset = start_file_offset + section_header->sh_size;
+  FileOffset start_file_offset = section_header->sh_offset;
+  FileOffset end_file_offset = start_file_offset + section_header->sh_size;
 
-  const uint8_t* start_pointer = OffsetToPointer(start_file_offset);
-  const uint8_t* end_pointer = OffsetToPointer(end_file_offset);
+  const uint8_t* start_pointer = FileOffsetToPointer(start_file_offset);
+  const uint8_t* end_pointer = FileOffsetToPointer(end_file_offset);
 
   // Quick way to convert from Pointer to RVA within a single Section is to
-  // subtract 'pointer_to_rva'.
+  // subtract |pointer_to_rva|.
   const uint8_t* const adjust_pointer_to_rva =
       start_pointer - section_header->sh_addr;
 
   // Find the rel32 relocations.
   const uint8_t* p = start_pointer;
-  bool on_32bit = 1; // 32-bit ARM ops appear on 32-bit boundaries, so track it
+  bool on_32bit = 1;  // 32-bit ARM ops appear on 32-bit boundaries, so track it
   while (p < end_pointer) {
     // Heuristic discovery of rel32 locations in instruction stream: are the
     // next few bytes the start of an instruction containing a rel32
     // addressing mode?
-
-    TypedRVAARM* rel32_rva = NULL;
+    scoped_ptr<TypedRVAARM> rel32_rva;
     RVA target_rva = 0;
     bool found = false;
 
     // 16-bit thumb ops
-    if (!found && (p + 3) <= end_pointer) {
+    if (!found && p + 3 <= end_pointer) {
       uint16_t pval = Read16LittleEndian(p);
       if ((pval & 0xF000) == 0xD000) {
         RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
 
-        rel32_rva = new TypedRVAARM(ARM_OFF8, rva);
-        if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
+        rel32_rva.reset(new TypedRVAARM(ARM_OFF8, rva));
+        if (!rel32_rva->ComputeRelativeTarget(p))
           return false;
-        }
+
         target_rva = rel32_rva->rva() + rel32_rva->relative_target();
         found = true;
       } else if ((pval & 0xF800) == 0xE000) {
         RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
 
-        rel32_rva = new TypedRVAARM(ARM_OFF11, rva);
-        if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
+        rel32_rva.reset(new TypedRVAARM(ARM_OFF11, rva));
+        if (!rel32_rva->ComputeRelativeTarget(p))
           return false;
-        }
+
         target_rva = rel32_rva->rva() + rel32_rva->relative_target();
         found = true;
       }
     }
 
-    // thumb-2 ops comprised of two 16-bit words
-    if (!found && (p + 5) <= end_pointer) {
+    // thumb-2 ops comprised of two 16-bit words.
+    if (!found && p + 5 <= end_pointer) {
       // This is really two 16-bit words, not one 32-bit word.
       uint32_t pval = (Read16LittleEndian(p) << 16) | Read16LittleEndian(p + 2);
       if ((pval & 0xF8008000) == 0xF0008000) {
         // Covers thumb-2's 32-bit conditional/unconditional branches
-
-        if ( (pval & (1 << 14)) || (pval & (1 << 12)) ) {
+        if ((pval & (1 << 14)) || (pval & (1 << 12))) {
           // A branch, with link, or with link and exchange.
           RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
 
-          rel32_rva = new TypedRVAARM(ARM_OFF25, rva);
-          if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
+          rel32_rva.reset(new TypedRVAARM(ARM_OFF25, rva));
+          if (!rel32_rva->ComputeRelativeTarget(p))
             return false;
-          }
+
           target_rva = rel32_rva->rva() + rel32_rva->relative_target();
           found = true;
+
         } else {
           // TODO(paulgazz) make sure cond is not 111
           // A conditional branch instruction
           RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
 
-          rel32_rva = new TypedRVAARM(ARM_OFF21, rva);
-          if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
+          rel32_rva.reset(new TypedRVAARM(ARM_OFF21, rva));
+          if (!rel32_rva->ComputeRelativeTarget(p))
             return false;
-          }
+
           target_rva = rel32_rva->rva() + rel32_rva->relative_target();
           found = true;
         }
       }
     }
 
-    // 32-bit ARM ops
+    // 32-bit ARM ops.
     if (!found && on_32bit && (p + 5) <= end_pointer) {
       uint32_t pval = Read32LittleEndian(p);
       if ((pval & 0x0E000000) == 0x0A000000) {
         // Covers both 0x0A 0x0B ARM relative branches
         RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
 
-        rel32_rva = new TypedRVAARM(ARM_OFF24, rva);
-        if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
+        rel32_rva.reset(new TypedRVAARM(ARM_OFF24, rva));
+        if (!rel32_rva->ComputeRelativeTarget(p))
           return false;
-        }
+
         target_rva = rel32_rva->rva() + rel32_rva->relative_target();
         found = true;
       }
     }
 
-    if (found && IsValidRVA(target_rva)) {
-      rel32_locations_.push_back(rel32_rva);
+    if (found && IsValidTargetRVA(target_rva)) {
+      uint16_t op_size = rel32_rva->op_size();
+      rel32_locations_.push_back(rel32_rva.release());
 #if COURGETTE_HISTOGRAM_TARGETS
       ++rel32_target_rvas_[target_rva];
 #endif
-      p += rel32_rva->op_size();
+      p += op_size;
 
-      // A tricky way to update the on_32bit flag.  Here is the truth table:
+      // A tricky way to update the on_32bit flag. Here is the truth table:
       // on_32bit | on_32bit   size is 4
       // ---------+---------------------
       // 1        | 0          0
       // 0        | 0          1
       // 0        | 1          0
       // 1        | 1          1
-      on_32bit = (~(on_32bit ^ (rel32_rva->op_size() == 4))) != 0;
+      on_32bit = (~(on_32bit ^ (op_size == 4))) != 0;
     } else {
       // Move 2 bytes at a time, but track 32-bit boundaries
       p += 2;