Represent UNW_INDEX table column-wise for better search locality

The UNW_INDEX table has 2 columns: address and index. This table is represented column wise so that binary search uses lesser number of pages and it is easier to represent the memory map as arrays of primitive types. BUG=819888 Change-Id: I7f3245cfc1526425aed414fe89ee01661b914a40 Reviewed-on: https://chromium-review.googlesource.com/985151 Commit-Queue: Siddhartha S <ssid@chromium.org> Reviewed-by: agrieve <agrieve@chromium.org> Cr-Commit-Position: refs/heads/master@{#547855}

Represent UNW_INDEX table column-wise for better search locality
The UNW_INDEX table has 2 columns: address and index. This table is represented column wise so that binary search uses lesser number of pages and it is easier to represent the memory map as arrays of primitive types. BUG=819888 Change-Id: I7f3245cfc1526425aed414fe89ee01661b914a40 Reviewed-on: https://chromium-review.googlesource.com/985151 Commit-Queue: Siddhartha S <ssid@chromium.org> Reviewed-by: agrieve <agrieve@chromium.org> Cr-Commit-Position: refs/heads/master@{#547855}
56c8ecc0 · Siddhartha · Commit Bot · a4c343c8 · 56c8ecc0 · 56c8ecc0
Commit 56c8ecc0 authored Apr 03, 2018 by Siddhartha Committed by Commit Bot Apr 03, 2018
5 changed files
--- a/base/trace_event/cfi_backtrace_android.cc
+++ b/base/trace_event/cfi_backtrace_android.cc
@@ -33,11 +33,13 @@ EHABI format. The first table contains function addresses and an index into the
 UNW_DATA table. The second table contains one or more rows for the function
 unwind information.
-The output file starts with 4 bytes counting the size of UNW_INDEX in bytes.
+UNW_INDEX contains two columns of N rows each, where N is the number of
-Then UNW_INDEX table and UNW_DATA table.
+functions.
-UNW_INDEX contains one row for each function. Each row is 6 bytes long:
+  1. First column 4 byte rows of all the function start address as offset from
-  4 bytes: Function start address.
+     start of the binary, in sorted order.
-  2 bytes: offset (in count of 2 bytes) of function data from start of UNW_DATA.
+  2. For each function addr, the second column contains 2 byte indices in order.
+     The indices are offsets (in count of 2 bytes) of the CFI data from start of
+     UNW_DATA.
 The last entry in the table always contains CANT_UNWIND index to specify the
 end address of the last function.
@@ -83,30 +85,6 @@ constexpr uint16_t kRAShift = 2;
 static_assert(sizeof(uintptr_t) == 4,
              "The unwind table format is only valid for 32 bit builds.");
-// The struct that corresponds to each row in the UNW_INDEX table. The first 4
-// bytes in the row represents the address of the function w.r.t. to the start
-// of the binary and the next 2 bytes have the index. The members of this struct
-// is in order of the input format. We cast the memory map of the unwind table
-// as an array of CFIUnwindIndexRow and use it to read data and search. So, the
-// size of this struct should be 6 bytes and the order of the members is fixed
-// according to the given format.
-struct CFIUnwindIndexRow {
-  // Declare all the members of the function with size 2 bytes to make sure the
-  // alignment is 2 bytes and the struct is not padded to 8 bytes. The |addr_l|
-  // and |addr_r| represent the lower and higher 2 bytes of the function
-  // address.
-  uint16_t addr_l;
-  uint16_t addr_r;
-  // The |index| is count in terms of 2 byte address into the UNW_DATA table,
-  // where the CFI data of the function exists.
-  uint16_t index;
-  // Returns the address of the function as offset from the start of the binary,
-  // to which the index row corresponds to.
-  uintptr_t addr() const { return (addr_r << 16) | addr_l; }
-};
 // The CFI data in UNW_DATA table starts with number of rows (N) and then
 // followed by N rows of 4 bytes long. The CFIUnwindDataRow represents a single
 // row of CFI data of a function in the table. Since we cast the memory at the
@@ -130,10 +108,6 @@ struct CFIUnwindDataRow {
  size_t cfa_offset() const { return cfi_data & kCFAMask; }
 };
-static_assert(
-    sizeof(CFIUnwindIndexRow) == 6,
-    "The CFIUnwindIndexRow struct must be exactly 6 bytes for searching.");
 static_assert(
    sizeof(CFIUnwindDataRow) == 4,
    "The CFIUnwindDataRow struct must be exactly 4 bytes for searching.");
@@ -173,22 +147,28 @@ void CFIBacktraceAndroid::Initialize() {
  if (!cfi_mmap_->Initialize(base::File(fd), cfi_region))
    return;
-  // The first 4 bytes in the file is the size of UNW_INDEX table. The UNW_INDEX
+  ParseCFITables();
-  // table contains rows of 6 bytes each.
+  can_unwind_stack_frames_ = true;
+}
+void CFIBacktraceAndroid::ParseCFITables() {
+  // The first 4 bytes in the file is the size of UNW_INDEX table.
+  static constexpr size_t kUnwIndexRowSize =
+      sizeof(*unw_index_function_col_) + sizeof(*unw_index_indices_col_);
  size_t unw_index_size = 0;
  memcpy(&unw_index_size, cfi_mmap_->data(), sizeof(unw_index_size));
-  DCHECK_EQ(0u, unw_index_size % sizeof(CFIUnwindIndexRow));
+  DCHECK_EQ(0u, unw_index_size % kUnwIndexRowSize);
-  DCHECK_GT(cfi_region.size, unw_index_size);
+  // UNW_INDEX table starts after 4 bytes.
-  unw_index_start_addr_ =
+  unw_index_function_col_ =
-      reinterpret_cast<const size_t*>(cfi_mmap_->data()) + 1;
+      reinterpret_cast<const uintptr_t*>(cfi_mmap_->data()) + 1;
-  unw_index_row_count_ = unw_index_size / sizeof(CFIUnwindIndexRow);
+  unw_index_row_count_ = unw_index_size / kUnwIndexRowSize;
+  unw_index_indices_col_ = reinterpret_cast<const uint16_t*>(
+      unw_index_function_col_ + unw_index_row_count_);
  // The UNW_DATA table data is right after the end of UNW_INDEX table.
  // Interpret the UNW_DATA table as an array of 2 byte numbers since the
  // indexes we have from the UNW_INDEX table are in terms of 2 bytes.
-  unw_data_start_addr_ = reinterpret_cast<const uint16_t*>(
+  unw_data_start_addr_ = unw_index_indices_col_ + unw_index_row_count_;
-      reinterpret_cast<uintptr_t>(unw_index_start_addr_) + unw_index_size);
-  can_unwind_stack_frames_ = true;
 }
 size_t CFIBacktraceAndroid::Unwind(const void** out_trace,
@@ -232,39 +212,37 @@ size_t CFIBacktraceAndroid::Unwind(const void** out_trace,
 bool CFIBacktraceAndroid::FindCFIRowForPC(
    uintptr_t func_addr,
    CFIBacktraceAndroid::CFIRow* cfi) const {
-  // Consider the UNW_TABLE as an array of CFIUnwindIndexRow since each row
+  // Consider each column of UNW_INDEX table as arrays of uintptr_t (function
-  // is 6 bytes long and it contains |unw_index_size_| / 6 rows. We define
+  // addresses) and uint16_t (indices). Define start and end iterator on the
-  // start and end iterator on this array and use std::lower_bound() to binary
+  // first column array (addresses) and use std::lower_bound() to binary search
-  // search on this array. std::lower_bound() returns the row that corresponds
+  // on this array to find the required function address.
-  // to the first row that has address greater than the current value, since
+  static const uintptr_t* const unw_index_fn_end =
-  // address is used in compartor.
+      unw_index_function_col_ + unw_index_row_count_;
-  const CFIUnwindIndexRow* start =
+  const uintptr_t* found =
-      static_cast<const CFIUnwindIndexRow*>(unw_index_start_addr_);
+      std::lower_bound(unw_index_function_col_, unw_index_fn_end, func_addr);
-  const CFIUnwindIndexRow* end = start + unw_index_row_count_;
-  const CFIUnwindIndexRow to_find = {func_addr & 0xffff, func_addr >> 16, 0};
-  const CFIUnwindIndexRow* found = std::lower_bound(
-      start, end, to_find,
-      [](const auto& a, const auto& b) { return a.addr() < b.addr(); });
  *cfi = {0};
  // If found is start, then the given function is not in the table. If the
  // given pc is start of a function then we cannot unwind.
-  if (found == start || found->addr() == func_addr)
+  if (found == unw_index_function_col_ || *found == func_addr)
    return false;
-  // The required row is always one less than the value returned by
+  // std::lower_bound() returns the iter that corresponds to the first address
-  // std::lower_bound().
+  // that is greater than the given address. So, the required iter is always one
-  found--;
+  // less than the value returned by std::lower_bound().
-  uintptr_t func_start_addr = found->addr();
+  --found;
+  uintptr_t func_start_addr = *found;
+  size_t row_num = found - unw_index_function_col_;
+  uint16_t index = unw_index_indices_col_[row_num];
  DCHECK_LE(func_start_addr, func_addr);
  // If the index is CANT_UNWIND then we do not have unwind infomation for the
  // function.
-  if (found->index == kCantUnwind)
+  if (index == kCantUnwind)
    return false;
  // The unwind data for the current function is at an offsset of the index
  // found in UNW_INDEX table.
-  const uint16_t* unwind_data = unw_data_start_addr_ + found->index;
+  const uint16_t* unwind_data = unw_data_start_addr_ + index;
  // The value of first 2 bytes is the CFI data row count for the function.
  uint16_t row_count = 0;
  memcpy(&row_count, unwind_data, sizeof(row_count));

--- a/base/trace_event/cfi_backtrace_android.h
+++ b/base/trace_event/cfi_backtrace_android.h
@@ -81,6 +81,9 @@ class BASE_EXPORT CFIBacktraceAndroid {
  // still reduce the total amount of address space available in process.
  void Initialize();
+  // Finds the UNW_INDEX and UNW_DATA tables in from the CFI file memory map.
+  void ParseCFITables();
  // Finds the CFI row for the given |func_addr| in terms of offset from
  // the start of the current binary.
  bool FindCFIRowForPC(uintptr_t func_addr, CFIRow* out) const;
@@ -94,8 +97,13 @@ class BASE_EXPORT CFIBacktraceAndroid {
  // because it is replaced in tests.
  std::unique_ptr<MemoryMappedFile> cfi_mmap_;
-  // The start address of UNW_IDX table.
+  // The UNW_INDEX table: Start address of the function address column. The
-  const void* unw_index_start_addr_ = nullptr;
+  // memory segment corresponding to this column is treated as an array of
+  // uintptr_t.
+  const uintptr_t* unw_index_function_col_ = nullptr;
+  // The UNW_INDEX table: Start address of the index column. The memory segment
+  // corresponding to this column is treated as an array of uint16_t.
+  const uint16_t* unw_index_indices_col_ = nullptr;
  // The number of rows in UNW_INDEX table.
  size_t unw_index_row_count_ = 0;

--- a/base/trace_event/cfi_backtrace_android_unittest.cc
+++ b/base/trace_event/cfi_backtrace_android_unittest.cc
@@ -66,13 +66,20 @@ TEST(CFIBacktraceAndroidTest, TestFindCFIRow) {
  STACK CFI INIT 2200 10
  STACK CFI 2204 .cfa: sp 44 + .ra: .cfa -8 + ^ r4: .cfa -16 + ^
  */
-  uint16_t input[] = {0x2A,   0x0,    0x1000, 0x0,    0x0,    0x1502, 0x0,
+  uint16_t input[] = {// UNW_INDEX size
-                      0xffff, 0x2000, 0x0,    0xb,    0x2024, 0x0,    0x10,
+                      0x2A,
-                      0x2126, 0x0,    0xffff, 0x2200, 0x0,    0x15,   0x2212,
-                      0x0,    0xffff, 0x5,    0x2,    0x111,  0x8,    0x220,
+                      // UNW_INDEX address column (4 byte rows).
-                      0x40,   0x330,  0x50,   0x332,  0x80,   0x220,  0x2,
+                      0x0, 0x1000, 0x0, 0x1502, 0x0, 0x2000, 0x0, 0x2024, 0x0,
-                      0x4,    0x13,   0x8,    0x13,   0x2,    0xc,    0x33,
+                      0x2126, 0x0, 0x2200, 0x0, 0x2212, 0x0,
-                      0xdc,   0x40,   0x1,    0x4,    0x2e};
+                      // UNW_INDEX index column (2 byte rows).
+                      0x0, 0xffff, 0xb, 0x10, 0xffff, 0x15, 0xffff,
+                      // UNW_DATA table.
+                      0x5, 0x2, 0x111, 0x8, 0x220, 0x40, 0x330, 0x50, 0x332,
+                      0x80, 0x220, 0x2, 0x4, 0x13, 0x8, 0x13, 0x2, 0xc, 0x33,
+                      0xdc, 0x40, 0x1, 0x4, 0x2e};
  FilePath temp_path;
  CreateTemporaryFile(&temp_path);
  EXPECT_EQ(
@@ -81,11 +88,7 @@ TEST(CFIBacktraceAndroidTest, TestFindCFIRow) {
  unwinder->cfi_mmap_.reset(new MemoryMappedFile());
  unwinder->cfi_mmap_->Initialize(temp_path);
-  unwinder->unw_index_start_addr_ =
+  unwinder->ParseCFITables();
-      reinterpret_cast<const size_t*>(unwinder->cfi_mmap_->data()) + 1;
-  unwinder->unw_index_row_count_ = input[0] / 6;
-  unwinder->unw_data_start_addr_ = reinterpret_cast<const uint16_t*>(
-      reinterpret_cast<uintptr_t>(unwinder->unw_index_start_addr_) + input[0]);
  CFIBacktraceAndroid::CFIRow cfi_row = {0};
  EXPECT_FALSE(unwinder->FindCFIRowForPC(0x00, &cfi_row));

--- a/build/android/gyp/extract_unwind_tables.py
+++ b/build/android/gyp/extract_unwind_tables.py
@@ -22,9 +22,14 @@ unwind information.
 The output file starts with 4 bytes counting the size of UNW_INDEX in bytes.
 Then UNW_INDEX table and UNW_DATA table.
-UNW_INDEX contains one row for each function. Each row is 6 bytes long:
-  4 bytes: Function start address.
+UNW_INDEX contains two columns of N rows each, where N is the number of
-  2 bytes: offset (in count of 2 bytes) of function data from start of UNW_DATA.
+functions.
+  1. First column 4 byte rows of all the function start address as offset from
+     start of the binary, in sorted order.
+  2. For each function addr, the second column contains 2 byte indices in order.
+     The indices are offsets (in count of 2 bytes) of the CFI data from start of
+     UNW_DATA.
 The last entry in the table always contains CANT_UNWIND index to specify the
 end address of the last function.
@@ -237,9 +242,11 @@ def _WriteCfiData(cfi_data, out_file):
  # Write the size of UNW_INDEX file in bytes.
  _Write4Bytes(out_file, len(func_addr_to_index) * 6)
-  # Write the UNW_INDEX table.
+  # Write the UNW_INDEX table. First list of addresses and then indices.
-  for addr, index in sorted(func_addr_to_index.iteritems()):
+  sorted_unw_index = sorted(func_addr_to_index.iteritems())
+  for addr, index in sorted_unw_index:
    _Write4Bytes(out_file, addr)
+  for addr, index in sorted_unw_index:
    _Write2Bytes(out_file, index)
  # Write the UNW_DATA table.

--- a/build/android/gyp/extract_unwind_tables_tests.py
+++ b/build/android/gyp/extract_unwind_tables_tests.py
@@ -92,16 +92,18 @@ STACK CFI 3b93218 .cfa: r7 16 + .ra: .cfa -4 + ^
      # |actual_output| is in blocks of 2 bytes. Skip first 4 bytes representing
      # size.
      unw_index_start = 2
-      unw_index_end = unw_index_start + unw_index_size / 2
+      unw_index_addr_end = unw_index_start + expected_function_count * 2
-      unw_index = actual_output[unw_index_start: unw_index_end]
+      unw_index_end = unw_index_addr_end + expected_function_count
+      unw_index_addr_col = actual_output[unw_index_start : unw_index_addr_end]
+      unw_index_index_col = actual_output[unw_index_addr_end : unw_index_end]
      unw_data_start = unw_index_end
      unw_data = actual_output[unw_data_start:]
      for func_iter in range(0, expected_function_count):
-        func_addr = (unw_index[func_iter * 3 + 1] << 16 |
+        func_addr = (unw_index_addr_col[func_iter * 2 + 1] << 16 |
-                     unw_index[func_iter * 3])
+                     unw_index_addr_col[func_iter * 2])
-        index = unw_index[func_iter * 3 + 2]
+        index = unw_index_index_col[func_iter]
        # If index is CANT_UNWIND then invalid function.
        if index == 0xFFFF:
          self.assertEqual(expected_cfi_data[func_addr], [])