Merge branch 'master' into ignore-declarations

commit: 58b103866b45cc534a860c136ac82ae8caa16f46 [log] [tgz]
author: Joshua Haberman <jhaberman@gmail.com> Sun Aug 08 16:25:54 2021 -0700
committer: Joshua Haberman <jhaberman@gmail.com> Sun Aug 08 16:25:54 2021 -0700
tree: 01250b008546e2912260faf6fba30ef228881864
parent: c952309265f1a888338ef1ea3fd3ec6d1f279b73 [diff]
parent: 90bac14f8ffc25414957ec05dff2dc66dbef937f [diff]
diff --git a/.github/workflows/cifuzz.yml b/.github/workflows/cifuzz.yml
new file mode 100644
index 0000000..0f33604
--- /dev/null
+++ b/.github/workflows/cifuzz.yml

@@ -0,0 +1,29 @@
+name: CIFuzz
+on: [pull_request]
+jobs:
+ Fuzzing:
+   runs-on: ubuntu-latest
+   strategy:
+     fail-fast: false
+     matrix:
+       sanitizer: [address, undefined]
+   steps:
+   - name: Build Fuzzers (${{ matrix.sanitizer }})
+     uses: google/oss-fuzz/infra/cifuzz/actions/build_fuzzers@master
+     with:
+       oss-fuzz-project-name: 'bloaty'
+       dry-run: false
+       sanitizer: ${{ matrix.sanitizer }}
+   - name: Run Fuzzers (${{ matrix.sanitizer }})
+     uses: google/oss-fuzz/infra/cifuzz/actions/run_fuzzers@master
+     with:
+       oss-fuzz-project-name: 'bloaty'
+       fuzz-seconds: 600
+       dry-run: false
+       sanitizer: ${{ matrix.sanitizer }}
+   - name: Upload Crash
+     uses: actions/upload-artifact@v4  # v1 is retired on GitHub-hosted runners; names stay unique per sanitizer
+     if: failure()
+     with:
+       name: ${{ matrix.sanitizer }}-artifacts
+       path: ./out/artifacts

diff --git a/CMakeLists.txt b/CMakeLists.txt
index d0d65ed..4e73f60 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt

@@ -118,7 +118,7 @@
   endif()
   if(NOT ZLIB_FOUND)
     add_subdirectory(third_party/zlib)
-    include_directories(third_party/zlib)
+    include_directories(SYSTEM third_party/zlib)
   endif()
 else()
   if(BLOATY_ENABLE_RE2)
@@ -223,8 +223,14 @@
     src/bloaty.h
     src/disassemble.cc
     ${CMAKE_CURRENT_BINARY_DIR}/src/bloaty.pb.cc
+    src/dwarf/attr.h
+    src/dwarf/attr.cc
+    src/dwarf/dwarf_util.cc
+    src/dwarf/debug_info.cc
+    src/dwarf/line_info.cc
     src/dwarf.cc
     src/dwarf_constants.h
+    src/eh_frame.cc
     src/elf.cc
     src/macho.cc
     src/pe.cc
@@ -282,7 +288,7 @@
   if(ZLIB_FOUND)
     list(APPEND LIBBLOATY_LIBS ZLIB::ZLIB)
   else()
-    list(APPEND LIBBLOATY_LIBS zlib)
+    list(APPEND LIBBLOATY_LIBS zlibstatic)
   endif()
 else()
   set(LIBBLOATY_LIBS libbloaty libprotoc capstone-static)

diff --git a/README.md b/README.md
index a83d4c7..98d9c80 100644
--- a/README.md
+++ b/README.md

@@ -54,7 +54,7 @@
 - **easy to deploy:** statically-linked C++ binary, easy to copy around
 
 For detailed info on all of Bloaty's features, see the [User
-Documentation](docs/using.md).
+Documentation](doc/using.md).
 
 For more information about the analysis performed by Bloaty,
 please see [How Bloaty Works](doc/how-bloaty-works.md).

diff --git a/src/bloaty.cc b/src/bloaty.cc
index 62fcbb3..f4bd554 100644
--- a/src/bloaty.cc
+++ b/src/bloaty.cc

@@ -12,6 +12,14 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
+#include <stddef.h>
+
+// For some reason z_size_t isn't getting defined by zconf.h in 32-bit builds.
+// It's very hard to figure out why. Defining it ourselves before including
+// <zlib.h> seems to fix it for now, but ideally we'd have a better solution.
+typedef size_t z_size_t;
+#include <zlib.h>
+
 #include <atomic>
 #include <cmath>
 #include <fstream>
@@ -41,7 +49,6 @@
 #endif
 #include <sys/stat.h>
 #include <sys/types.h>
-#include <zlib.h>
 
 #include "absl/debugging/internal/demangle.h"
 #include "absl/memory/memory.h"
@@ -158,72 +165,12 @@
   }
 }
 
-
-// LineReader / LineIterator ///////////////////////////////////////////////////
-
-// Convenience code for iterating over lines of a pipe.
-
-#if !defined(_MSC_VER)
-LineReader::LineReader(LineReader&& other) {
-  Close();
-
-  file_ = other.file_;
-  pclose_ = other.pclose_;
-
-  other.file_ = nullptr;
-}
-
-void LineReader::Close() {
-  if (!file_) return;
-
-  if (pclose_) {
-    pclose(file_);
-  } else {
-    fclose(file_);
-  }
-}
-
-void LineReader::Next() {
-  char buf[256];
-  line_.clear();
-  do {
-    if (!fgets(buf, sizeof(buf), file_)) {
-      if (feof(file_)) {
-        eof_ = true;
-        break;
-      } else {
-        std::cerr << "Error reading from file.\n";
-        exit(1);
-      }
-    }
-    line_.append(buf);
-  } while(!eof_ && line_[line_.size() - 1] != '\n');
-
-  if (!eof_) {
-    line_.resize(line_.size() - 1);
-  }
-}
-
-LineIterator LineReader::begin() { return LineIterator(this); }
-LineIterator LineReader::end() { return LineIterator(nullptr); }
-
-LineReader ReadLinesFromPipe(const std::string& cmd) {
-  FILE* pipe = popen(cmd.c_str(), "r");
-
-  if (!pipe) {
-    std::cerr << "Failed to run command: " << cmd << "\n";
-    exit(1);
-  }
-
-  return LineReader(pipe, true);
-}
-#endif
-
 extern "C" char* __cxa_demangle(const char* mangled_name, char* buf, size_t* n,
                                 int* status);
 
 std::string ItaniumDemangle(string_view symbol, DataSource source) {
-  if (source == DataSource::kRawSymbols) {
+  if (source != DataSource::kShortSymbols &&
+      source != DataSource::kFullSymbols) {
     // No demangling.
     return std::string(symbol);
   }
@@ -1349,6 +1296,15 @@
   if (!arena_) {
     THROW("This range sink isn't prepared to zlib decompress.");
   }
+  uint64_t mb = 1 << 20;
+  // Limit for uncompressed size is 30x the compressed size + 128MB.
+  if (uncompressed_size > static_cast<uint64_t>(data.size()) * 30 + (128 * mb)) {
+    fprintf(stderr,
+            "warning: ignoring compressed debug data, implausible uncompressed "
+            "size (compressed: %zu, uncompressed: %" PRIu64 ")\n",
+            data.size(), uncompressed_size);
+    return absl::string_view();
+  }
   unsigned char *dbuf =
       arena_->google::protobuf::Arena::CreateArray<unsigned char>(
           arena_, uncompressed_size);
@@ -1616,7 +1572,7 @@
   void PrintMaps(const std::vector<const RangeMap*> maps) {
     uint64_t last = 0;
     uint64_t max = maps[0]->GetMaxAddress();
-    int hex_digits = std::ceil(std::log2(max) / 4);
+    int hex_digits = max > 0 ? std::ceil(std::log2(max) / 4) : 0;
     RangeMap::ComputeRollup(maps, [&](const std::vector<std::string>& keys,
                                       uint64_t addr, uint64_t end) {
       if (addr > last) {

diff --git a/src/bloaty.h b/src/bloaty.h
index e5a1128..9ed2be0 100644
--- a/src/bloaty.h
+++ b/src/bloaty.h

@@ -35,6 +35,7 @@
 #include "absl/strings/strip.h"
 #include "capstone/capstone.h"
 
+#include "dwarf/debug_info.h"
 #include "bloaty.pb.h"
 #include "range_map.h"
 #include "re.h"
@@ -290,99 +291,15 @@
 std::unique_ptr<ObjectFile> TryOpenWebAssemblyFile(std::unique_ptr<InputFile>& file);
 std::unique_ptr<ObjectFile> TryOpenPEFile(std::unique_ptr<InputFile>& file);
 
-namespace dwarf {
-
-struct File {
-  absl::string_view debug_abbrev;
-  absl::string_view debug_addr;
-  absl::string_view debug_aranges;
-  absl::string_view debug_info;
-  absl::string_view debug_line;
-  absl::string_view debug_loc;
-  absl::string_view debug_pubnames;
-  absl::string_view debug_pubtypes;
-  absl::string_view debug_ranges;
-  absl::string_view debug_rnglists;
-  absl::string_view debug_str;
-  absl::string_view debug_str_offsets;
-  absl::string_view debug_types;
-
-  absl::string_view* GetFieldByName(absl::string_view name);
-  void SetFieldByName(absl::string_view name, absl::string_view contents) {
-    absl::string_view *member = GetFieldByName(name);
-    if (member) *member = contents;
-  }
-};
-
-}  // namespace dwarf
-
 // Provided by dwarf.cc.  To use these, a module should fill in a dwarf::File
 // and then call these functions.
-void ReadDWARFCompileUnits(const dwarf::File& file, const SymbolTable& symtab,
-                           const DualMap& map, RangeSink* sink);
+void ReadDWARFCompileUnits(const dwarf::File& file, const DualMap& map,
+                           RangeSink* sink);
 void ReadDWARFInlines(const dwarf::File& file, RangeSink* sink,
                       bool include_line);
 void ReadEhFrame(absl::string_view contents, RangeSink* sink);
 void ReadEhFrameHdr(absl::string_view contents, RangeSink* sink);
 
-
-// LineReader //////////////////////////////////////////////////////////////////
-
-// Provides range-based for to iterate over lines in a pipe.
-//
-// for ( auto& line : ReadLinesFromPipe("ls -l") ) {
-// }
-
-class LineIterator;
-
-class LineReader {
- public:
-  LineReader(FILE* file, bool pclose) : file_(file), pclose_(pclose) {}
-  LineReader(LineReader&& other);
-  LineReader(const LineReader&) = delete;
-  LineReader& operator=(const LineReader&);
-
-
-  ~LineReader() { Close(); }
-
-  LineIterator begin();
-  LineIterator end();
-
-  void Next();
-
-  const std::string& line() const { return line_; }
-  bool eof() { return eof_; }
-
- private:
-  void Close();
-
-  FILE* file_;
-  std::string line_;
-  bool eof_ = false;
-  bool pclose_;
-};
-
-class LineIterator {
- public:
-  LineIterator(LineReader* reader) : reader_(reader) {}
-
-  bool operator!=(const LineIterator& /*other*/) const {
-    // Hack for range-based for.
-    return !reader_->eof();
-  }
-
-  void operator++() { reader_->Next(); }
-
-  const std::string& operator*() const {
-    return reader_->line();
-  }
-
- private:
-  LineReader* reader_;
-};
-
-LineReader ReadLinesFromPipe(const std::string& cmd);
-
 // Demangle C++ symbols according to the Itanium ABI.  The |source| argument
 // controls what demangling mode we are using.
 std::string ItaniumDemangle(absl::string_view symbol, DataSource source);

diff --git a/src/disassemble.cc b/src/disassemble.cc
index 6e9cdc4..4f5d2f3 100644
--- a/src/disassemble.cc
+++ b/src/disassemble.cc

@@ -53,6 +53,7 @@
   }
 
   if (info.text.size() == 0) {
+    cs_close(&handle);
     THROW("Tried to disassemble empty function.");
   }
 

diff --git a/src/dwarf.cc b/src/dwarf.cc
index 938f20e..d062c55 100644
--- a/src/dwarf.cc
+++ b/src/dwarf.cc

@@ -34,6 +34,9 @@
 #include "bloaty.pb.h"
 #include "dwarf_constants.h"
 #include "util.h"
+#include "dwarf/attr.h"
+#include "dwarf/dwarf_util.h"
+#include "dwarf/line_info.h"
 
 using namespace dwarf2reader;
 using absl::string_view;
@@ -44,320 +47,6 @@
 
 namespace dwarf {
 
-int DivRoundUp(int n, int d) {
-  return (n + (d - 1)) / d;
-}
-
-namespace {
-
-// uint64/32 max is a tombstone value added by https://reviews.llvm.org/D81784.
-bool IsValidDwarfAddress(uint64_t addr, uint8_t address_size) {
-  if (addr == 0)
-    return false;
-  if (address_size == 4 && addr == std::numeric_limits<uint32_t>::max())
-    return false;
-  if (address_size == 8 && addr == std::numeric_limits<uint64_t>::max())
-    return false;
-  return true;
-}
-
-}  // namespace
-
-// Low-level Parsing Routines //////////////////////////////////////////////////
-
-// For parsing the low-level values found in DWARF files.  These are the only
-// routines that touch the bytes of the input buffer directly.  Everything else
-// is layered on top of these.
-
-// Parses the LEB128 format defined by DWARF (both signed and unsigned
-// versions).
-
-uint64_t ReadLEB128Internal(bool is_signed, string_view* data) {
-  uint64_t ret = 0;
-  int shift = 0;
-  int maxshift = 70;
-  const char* ptr = data->data();
-  const char* limit = ptr + data->size();
-
-  while (ptr < limit && shift < maxshift) {
-    char byte = *(ptr++);
-    ret |= static_cast<uint64_t>(byte & 0x7f) << shift;
-    shift += 7;
-    if ((byte & 0x80) == 0) {
-      data->remove_prefix(ptr - data->data());
-      if (is_signed && shift < 64 && (byte & 0x40)) {
-        ret |= -(1ULL << shift);
-      }
-      return ret;
-    }
-  }
-
-  THROW("corrupt DWARF data, unterminated LEB128");
-}
-
-template <typename T>
-T ReadLEB128(string_view* data) {
-  typedef typename std::conditional<std::is_signed<T>::value, int64_t,
-                                    uint64_t>::type Int64Type;
-  Int64Type val = ReadLEB128Internal(std::is_signed<T>::value, data);
-  if (val > std::numeric_limits<T>::max() ||
-      val < std::numeric_limits<T>::min()) {
-    THROW("DWARF data contained larger LEB128 than we were expecting");
-  }
-  return static_cast<T>(val);
-}
-
-void SkipLEB128(string_view* data) {
-  size_t limit =
-      std::min(static_cast<size_t>(data->size()), static_cast<size_t>(10));
-  for (size_t i = 0; i < limit; i++) {
-    if (((*data)[i] & 0x80) == 0) {
-      data->remove_prefix(i + 1);
-      return;
-    }
-  }
-
-  THROW("corrupt DWARF data, unterminated LEB128");
-}
-
-// Some size information attached to each compilation unit.  The size of an
-// address or offset in the DWARF data depends on this state which is parsed
-// from the header.
-class CompilationUnitSizes {
- public:
-  // When true, DWARF offsets are 64 bits, otherwise they are 32 bit.
-  bool dwarf64() const { return dwarf64_; }
-
-  // The size of addresses.  Guaranteed to be either 4 or 8.
-  uint8_t address_size() const { return address_size_; }
-
-  // DWARF version of this unit.
-  uint8_t dwarf_version() const { return dwarf_version_; }
-
-  uint64_t addr_base() const { return addr_base_; }
-  uint64_t str_offsets_base() const { return str_offsets_base_; }
-  uint64_t range_lists_base() const { return range_lists_base_; }
-
-  void SetAddressSize(uint8_t address_size) {
-    if (address_size != 4 && address_size != 8) {
-      THROWF("Unexpected address size: $0", address_size);
-    }
-    address_size_ = address_size;
-  }
-
-  void SetAddrBase(uint64_t addr_base) {
-    addr_base_ = addr_base;
-  }
-
-  void SetStrOffsetsBase(uint64_t str_offsets_base) {
-    str_offsets_base_ = str_offsets_base;
-  }
-
-  void SetRangeListsBase(uint64_t range_lists_base) {
-    range_lists_base_ = range_lists_base;
-  }
-
-  // To allow this as the key in a map.
-  bool operator<(const CompilationUnitSizes& rhs) const {
-    return std::tie(dwarf64_, address_size_) <
-           std::tie(rhs.dwarf64_, rhs.address_size_);
-  }
-
-  // Reads a DWARF offset based on whether we are reading dwarf32 or dwarf64
-  // format.
-  uint64_t ReadDWARFOffset(string_view* data) const {
-    if (dwarf64_) {
-      return ReadFixed<uint64_t>(data);
-    } else {
-      return ReadFixed<uint32_t>(data);
-    }
-  }
-
-  // Reads an address according to the expected address_size.
-  uint64_t ReadAddress(string_view* data) const {
-    if (address_size_ == 8) {
-      return ReadFixed<uint64_t>(data);
-    } else if (address_size_ == 4) {
-      return ReadFixed<uint32_t>(data);
-    } else {
-      BLOATY_UNREACHABLE();
-    }
-  }
-
-  uint64_t GetMaxAddress() const {
-    if (address_size_ == 8) {
-      return UINT64_MAX;
-    } else if (address_size_ == 4) {
-      return UINT32_MAX;
-    } else {
-      BLOATY_UNREACHABLE();
-    }
-  }
-
-  // Reads an "initial length" as specified in many DWARF headers.  This
-  // contains either a 32-bit or a 64-bit length, and signals whether we are
-  // using the 32-bit or 64-bit DWARF format (so it sets dwarf64 appropriately).
-  //
-  // Returns the range for this section and stores the remaining data
-  // in |remaining|.
-  string_view ReadInitialLength(string_view* remaining) {
-    uint64_t len = ReadFixed<uint32_t>(remaining);
-
-    if (len == 0xffffffff) {
-      dwarf64_ = true;
-      len = ReadFixed<uint64_t>(remaining);
-    } else {
-      dwarf64_ = false;
-    }
-
-    if (remaining->size() < len) {
-      THROW("short DWARF compilation unit");
-    }
-
-    string_view unit = *remaining;
-    unit.remove_suffix(remaining->size() - len);
-    *remaining = remaining->substr(len);
-    return unit;
-  }
-
-  void ReadDWARFVersion(string_view* data) {
-    dwarf_version_ = ReadFixed<uint16_t>(data);
-  }
-
- private:
-  uint16_t dwarf_version_;
-  bool dwarf64_;
-  uint8_t address_size_;
-  uint64_t addr_base_ = 0;
-  uint64_t str_offsets_base_ = 0;
-  uint64_t range_lists_base_ = 0;
-};
-
-
-// AbbrevTable /////////////////////////////////////////////////////////////////
-
-// Parses and stores a representation of (a portion of) the .debug_abbrev
-// section of a DWARF file.  An abbreviation is defined by a unique "code"
-// (unique within one table), and defines the DIE tag and set of attributes.
-// The encoding of the DIE then contains just the abbreviation code and the
-// attribute values -- thanks to the abbreviation table, the tag and attribute
-// keys/names are not required.
-//
-// The abbreviations are an internal detail of the DWARF format and users should
-// not need to care about them.
-
-class AbbrevTable {
- public:
-  // Reads abbreviations until a terminating abbreviation is seen.
-  string_view ReadAbbrevs(string_view data);
-
-  // In a DWARF abbreviation, each attribute has a name and a form.
-  struct Attribute {
-    uint16_t name;
-    uint8_t form;
-  };
-
-  // The representation of a single abbreviation.
-  struct Abbrev {
-    uint32_t code;
-    uint16_t tag;
-    bool has_child;
-    std::vector<Attribute> attr;
-  };
-
-  bool IsEmpty() const { return abbrev_.empty(); }
-
-  // Looks for an abbreviation with the given code.  Returns true if the lookup
-  // succeeded.
-  bool GetAbbrev(uint32_t code, const Abbrev** abbrev) const {
-    auto it = abbrev_.find(code);
-    if (it != abbrev_.end()) {
-      *abbrev = &it->second;
-      return true;
-    } else {
-      return false;
-    }
-  }
-
- private:
-  // Keyed by abbreviation code.
-  // Generally we expect these to be small, so we could almost use a vector<>.
-  // But you never know what crazy input data is going to do...
-  std::unordered_map<uint32_t, Abbrev> abbrev_;
-};
-
-string_view AbbrevTable::ReadAbbrevs(string_view data) {
-  while (true) {
-    uint32_t code = ReadLEB128<uint32_t>(&data);
-
-    if (code == 0) {
-      return data;  // Terminator entry.
-    }
-
-    Abbrev& abbrev = abbrev_[code];
-
-    if (abbrev.code) {
-      THROW("DWARF data contained duplicate abbrev code");
-    }
-
-    uint8_t has_child;
-
-    abbrev.code = code;
-    abbrev.tag = ReadLEB128<uint16_t>(&data);
-    has_child = ReadFixed<uint8_t>(&data);
-
-    switch (has_child) {
-      case DW_children_yes:
-        abbrev.has_child = true;
-        break;
-      case DW_children_no:
-        abbrev.has_child = false;
-        break;
-      default:
-        THROWF("DWARF has_child is neither true nor false: $0, code=$1, tag=$2",
-               has_child, abbrev.code, abbrev.tag);
-    }
-
-    while (true) {
-      Attribute attr;
-      attr.name = ReadLEB128<uint16_t>(&data);
-      attr.form = ReadLEB128<uint8_t>(&data);
-
-      if (attr.name == 0 && attr.form == 0) {
-        break;  // End of this abbrev
-      }
-
-      abbrev.attr.push_back(attr);
-    }
-  }
-}
-
-
-// StringTable /////////////////////////////////////////////////////////////////
-
-// Represents the .debug_str portion of a DWARF file and contains code for
-// reading strings out of it.  This is an internal detail of the DWARF format
-// and users should not need to care about it.
-
-class StringTable {
- public:
-  // Construct with the debug_str data from a DWARF file.
-  StringTable(string_view debug_str) : debug_str_(debug_str) {}
-
-  // Read a string from the table.
-  string_view ReadEntry(size_t ofs) const;
-
- private:
-  string_view debug_str_;
-};
-
-string_view StringTable::ReadEntry(size_t ofs) const {
-  string_view str = debug_str_;
-  SkipBytes(ofs, &str);
-  return ReadNullTerminated(&str);
-}
-
-
 // AddressRanges ///////////////////////////////////////////////////////////////
 
 // Code for reading address ranges out of .debug_aranges.
@@ -372,6 +61,8 @@
   // Address and length for this range.
   uint64_t address() { return address_; }
   uint64_t length() { return length_; }
+  // The range of the file where this data occurs.
+  string_view data() { return data_; }
 
   // Advance to the next range.  The values will be available in address() and
   // length().  Returns false when the end of this compilation unit is hit.
@@ -386,6 +77,7 @@
 
  private:
   CompilationUnitSizes sizes_;
+  string_view data_;
   string_view section_;
   string_view unit_remaining_;
   string_view next_unit_;
@@ -399,8 +91,10 @@
     return false;
   }
 
+  const char* start = unit_remaining_.data();
   address_ = sizes_.ReadAddress(&unit_remaining_);
   length_ = sizes_.ReadAddress(&unit_remaining_);
+  data_ = string_view(start, unit_remaining_.data() - start);
   return true;
 }
 
@@ -477,625 +171,16 @@
   return available.substr(0, list.read_offset() - available.data());
 }
 
-// DIEReader ///////////////////////////////////////////////////////////////////
-
-// Reads a sequence of DWARF DIE's (Debugging Information Entries) from the
-// .debug_info or .debug_types section of a binary.
-//
-// Each DIE contains a tag and a set of attribute/value pairs.  We rely on the
-// abbreviations in an AbbrevTable to decode the DIEs.
-
-class DIEReader {
- public:
-  // Constructs a new DIEReader.  Cannot be used until you call one of the
-  // Seek() methods below.
-  DIEReader(const File& file) : dwarf_(file) {}
-  DIEReader(const DIEReader&) = delete;
-  DIEReader& operator=(const DIEReader&) = delete;
-
-  // Returns true if we are at the end of DIEs for this compilation unit.
-  bool IsEof() const { return state_ == State::kEof; }
-
-  // DIEs exist in both .debug_info and .debug_types.
-  enum class Section {
-    kDebugInfo,
-    kDebugTypes
-  };
-
-  // Seeks to the overall start or the start of a specific compilation unit.
-  // Note that |header_offset| is the offset of the compilation unit *header*,
-  // not the offset of the first DIE.
-  bool SeekToCompilationUnit(Section section, uint64_t header_offset);
-  bool SeekToStart(Section section) {
-    return SeekToCompilationUnit(section, 0);
-  }
-
-  bool NextCompilationUnit();
-
-  // Advances to the next overall DIE, ignoring whether it happens to be a
-  // child, a sibling, or an uncle/aunt.  Returns false at error or EOF.
-  bool NextDIE();
-
-  // Skips children of the current DIE, so that the next call to NextDIE()
-  // will read the next sibling (or parent, if no sibling exists).
-  bool SkipChildren();
-
-  const AbbrevTable::Abbrev& GetAbbrev() const {
-    assert(!IsEof());
-    return *current_abbrev_;
-  }
-
-  // Returns the current read offset within the current compilation unit.
-  int64_t GetReadOffset() const { return remaining_.data() - start_; }
-
-  int GetDepth() const { return depth_; }
-
-  // Returns the tag of the current DIE.
-  // Requires that ReadCode() has been called at least once.
-  uint16_t GetTag() const { return GetAbbrev().tag; }
-
-  // Returns whether the current DIE has a child.
-  // Requires that ReadCode() has been called at least once.
-  bool HasChild() const { return GetAbbrev().has_child; }
-
-  template <class T>
-  void ReadAttributes(T&& func);
-
-  const File& dwarf() const { return dwarf_; }
-
-  string_view unit_range() const { return unit_range_; }
-  const CompilationUnitSizes& unit_sizes() const { return unit_sizes_; }
-  uint32_t abbrev_version() const { return abbrev_version_; }
-  uint64_t debug_abbrev_offset() const { return debug_abbrev_offset_; }
-
-  // If both compileunit_name and strp_sink are set, this will automatically
-  // call strp_sink->AddFileRange(compileunit_name, <string range>) for every
-  // DW_FORM_strp attribute encountered.  These strings occur in the .debug_str
-  // section.
-  void set_compileunit_name(absl::string_view name) {
-    unit_name_ = std::string(name);
-  }
-  void set_strp_sink(RangeSink* sink) { strp_sink_ = sink; }
-
-  void AddIndirectString(string_view range) const {
-    if (strp_sink_) {
-      strp_sink_->AddFileRange("dwarf_strp", unit_name_, range);
-    }
-  }
-
-  CompilationUnitSizes* mutable_unit_sizes() { return &unit_sizes_; }
-
- private:
-  // Internal APIs.
-
-  bool ReadCompilationUnitHeader();
-  bool ReadCode();
-  void SkipNullEntries();
-
-  enum class State {
-    kReadyToReadAttributes,
-    kReadyToNext,
-    kEof,
-  } state_;
-
-  std::string error_;
-
-  const File& dwarf_;
-  RangeSink* strp_sink_ = nullptr;
-  const char *start_ = nullptr;
-
-  // Abbreviation for the current entry.
-  const AbbrevTable::Abbrev* current_abbrev_;
-
-  // Our current read position.
-  string_view remaining_;
-  uint64_t sibling_offset_;
-  int depth_ = 0;
-
-  // Data for the next compilation unit.
-  string_view next_unit_;
-
-  // All of the AbbrevTables we've read from .debug_abbrev, indexed by their
-  // offset within .debug_abbrev.
-  std::unordered_map<uint64_t, AbbrevTable> abbrev_tables_;
-
-  // Whether we are in .debug_types or .debug_info.
-  Section section_;
-
-  // Information about the current compilation unit.
-  uint64_t debug_abbrev_offset_;
-  std::string unit_name_;
-  string_view unit_range_;
-  UnitType unit_type_;
-  uint64_t dwo_id_;
-  CompilationUnitSizes unit_sizes_;
-  AbbrevTable* unit_abbrev_;
-
-  // A small integer that uniquely identifies the combination of unit_abbrev_
-  // and unit_sizes_.  Attribute readers use this to know when they can reuse an
-  // existing (abbrev code) -> (Actions) mapping, since this table depends on
-  // both the current abbrev. table and the sizes.
-  uint32_t abbrev_version_;
-
-  std::map<std::pair<AbbrevTable*, CompilationUnitSizes>, size_t>
-      abbrev_versions_;
-
-  // Only for .debug_types
-  uint64_t unit_type_signature_;
-  uint64_t unit_type_offset_;
-};
-
-class AttrValue {
- public:
-  static AttrValue ParseAttr(const DIEReader &reader, uint8_t form,
-                             string_view *data);
-
-  AttrValue(const AttrValue &) = default;
-  AttrValue &operator=(const AttrValue &) = default;
-
-  bool IsUint() const {
-    return type_ == Type::kUint || type_ == Type::kUnresolvedUint;
-  }
-
-  bool IsString() const {
-    return type_ == Type::kString || type_ == Type::kUnresolvedString;
-  }
-
-  absl::optional<uint64_t> ToUint(const DIEReader& reader) const {
-    if (IsUint()) return GetUint(reader);
-    string_view str = GetString(reader);
-    switch (str.size()) {
-      case 1:
-        return ReadFixed<uint8_t>(&str);
-      case 2:
-        return ReadFixed<uint8_t>(&str);
-      case 4:
-        return ReadFixed<uint32_t>(&str);
-      case 8:
-        return ReadFixed<uint64_t>(&str);
-    }
-    return absl::nullopt;
-  }
-
-  uint64_t GetUint(const DIEReader& reader) const {
-    if (type_ == Type::kUnresolvedUint) {
-      return ResolveIndirectAddress(reader);
-    } else {
-      assert(type_ == Type::kUint);
-      return uint_;
-    }
-  }
-
-  string_view GetString(const DIEReader& reader) const {
-    if (type_ == Type::kUnresolvedString) {
-      return ResolveDoubleIndirectString(reader);
-    } else {
-      assert(type_ == Type::kString);
-      return string_;
-    }
-  }
-
-  void SetForm(uint16_t form) {
-    form_ = form;
-  }
-
-  uint16_t form() const { return form_; }
-
-  std::string DebugString() const {
-    if (type_ == Type::kUint) {
-      return absl::Substitute("AttrValue{type_=Type::kUint, form_=$0, uint_=$1}", form_, uint_);
-    } else {
-      return absl::Substitute("AttrValue{type_=Type::kString, form_=$0, string_=$1}", form_, string_);
-    }
-  }
-
- private:
-  explicit AttrValue(uint64_t val) : uint_(val), type_(Type::kUint) {}
-  explicit AttrValue(string_view val) : string_(val), type_(Type::kString) {}
-  
-  // Some attribute values remain unresolved after being parsed.
-  // We have to delay the resolution of some indirect values because they are
-  // dependent on bases that come after it in the sequence of attributes, eg.
-  //
-  // $ dwarfdump -i bloaty
-  //   COMPILE_UNIT<header overall offset = 0x00000000>:
-  // < 0><0x0000000c>  DW_TAG_compile_unit
-  //                     DW_AT_producer              (indexed string: 0x00000000)Debian clang version 11.0.1-2
-  //                     DW_AT_language              DW_LANG_C_plus_plus_14
-  //                     DW_AT_name                  (indexed string: 0x00000001)../src/main.cc
-  //                     DW_AT_str_offsets_base      0x00000008
-  //
-  // Note that DW_AT_name comes before DW_AT_str_offset_base, but the latter
-  // value is required to resolve the name attribute.
-  enum class Type {
-    kUint,
-    kString,
-    kUnresolvedUint,
-    kUnresolvedString
-  };
-
-  Type type() const { return type_; }
-
-  static AttrValue UnresolvedUint(uint64_t val) {
-     AttrValue ret(val);
-     ret.type_ = Type::kUnresolvedUint;
-     return ret;
-  }
-
-  static AttrValue UnresolvedString(uint64_t val) {
-     AttrValue ret(val);
-     ret.type_ = Type::kUnresolvedString;
-     return ret;
-  }
-
-  union {
-    uint64_t uint_;
-    string_view string_;
-  };
-
-  Type type_;
-  uint16_t form_;
-
-  template <class D>
-  static string_view ReadBlock(string_view* data);
-  static string_view ReadVariableBlock(string_view* data);
-  template <class D>
-  static string_view ReadIndirectString(const DIEReader &reader,
-                                        string_view *data);
-  static string_view ResolveIndirectString(const DIEReader &reader,
-                                           uint64_t ofs);
-
-  string_view ResolveDoubleIndirectString(const DIEReader &reader) const;
-  uint64_t ResolveIndirectAddress(const DIEReader& reader) const;
-};
-
-uint64_t ReadIndirectAddress(const DIEReader& reader, uint64_t val) {
-  string_view addrs = reader.dwarf().debug_addr;
-  const dwarf::CompilationUnitSizes& sizes = reader.unit_sizes();
-  switch (sizes.address_size()) {
-    case 4:
-      SkipBytes((val * 4) + sizes.addr_base(), &addrs);
-      return ReadFixed<uint32_t>(&addrs);
-    case 8:
-      SkipBytes((val * 8) + sizes.addr_base(), &addrs);
-      return ReadFixed<uint64_t>(&addrs);
-    default:
-      BLOATY_UNREACHABLE();
-  }
-}
-
-template <class D>
-string_view AttrValue::ReadBlock(string_view* data) {
-  D len = ReadFixed<D>(data);
-  return ReadBytes(len, data);
-}
-
-string_view AttrValue::ReadVariableBlock(string_view* data) {
-  uint64_t len = ReadLEB128<uint64_t>(data);
-  return ReadBytes(len, data);
-}
-
-string_view AttrValue::ResolveIndirectString(const DIEReader &reader,
-                                             uint64_t ofs) {
-  StringTable table(reader.dwarf().debug_str);
-  string_view ret = table.ReadEntry(ofs);
-  reader.AddIndirectString(ret);
-  return ret;
-}
-
-template <class D>
-string_view AttrValue::ReadIndirectString(const DIEReader &reader,
-                                          string_view *data) {
-  return ResolveIndirectString(reader, ReadFixed<D>(data));
-}
-
-string_view
-AttrValue::ResolveDoubleIndirectString(const DIEReader &reader) const {
-  uint64_t ofs = uint_;
-  string_view offsets = reader.dwarf().debug_str_offsets;
-  uint64_t ofs2;
-  if (reader.unit_sizes().dwarf64()) {
-    SkipBytes((ofs * 8) + reader.unit_sizes().str_offsets_base(), &offsets);
-    ofs2 = ReadFixed<uint64_t>(&offsets);
-  } else {
-    SkipBytes((ofs * 4) + reader.unit_sizes().str_offsets_base(), &offsets);
-    ofs2 = ReadFixed<uint32_t>(&offsets);
-  }
-  StringTable table(reader.dwarf().debug_str);
-  string_view ret = table.ReadEntry(ofs2);
-  reader.AddIndirectString(ret);
-  return ret;
-}
-
-uint64_t AttrValue::ResolveIndirectAddress(const DIEReader& reader) const {
-  return ReadIndirectAddress(reader, uint_);
-}
-
-AttrValue AttrValue::ParseAttr(const DIEReader &reader, uint8_t form,
-                               string_view *data) {
-  switch (form) {
-    case DW_FORM_indirect: {
-      uint16_t indirect_form = ReadLEB128<uint16_t>(data);
-      if (indirect_form == DW_FORM_indirect) {
-        THROW("indirect attribute has indirect form type");
-      }
-      return ParseAttr(reader, indirect_form, data);
-    }
-    case DW_FORM_ref1:
-      return AttrValue(ReadFixed<uint8_t>(data));
-    case DW_FORM_ref2:
-      return AttrValue(ReadFixed<uint16_t>(data));
-    case DW_FORM_ref4:
-      return AttrValue(ReadFixed<uint32_t>(data));
-    case DW_FORM_ref_sig8:
-    case DW_FORM_ref8:
-      return AttrValue(ReadFixed<uint64_t>(data));
-    case DW_FORM_ref_udata:
-    case DW_FORM_strx1:
-      return AttrValue::UnresolvedString(ReadFixed<uint8_t>(data));
-    case DW_FORM_strx2:
-      return AttrValue::UnresolvedString(ReadFixed<uint16_t>(data));
-    case DW_FORM_strx4:
-      return AttrValue::UnresolvedString(ReadFixed<uint32_t>(data));
-    case DW_FORM_strx:
-      return AttrValue::UnresolvedString(ReadLEB128<uint64_t>(data));
-    case DW_FORM_addrx1:
-      return AttrValue::UnresolvedUint(ReadFixed<uint8_t>(data));
-    case DW_FORM_addrx2:
-      return AttrValue::UnresolvedUint(ReadFixed<uint16_t>(data));
-    case DW_FORM_addrx3:
-      return AttrValue::UnresolvedUint(ReadFixed<uint32_t, 3>(data));
-    case DW_FORM_addrx4:
-      return AttrValue::UnresolvedUint(ReadFixed<uint32_t>(data));
-    case DW_FORM_addrx:
-      return AttrValue::UnresolvedUint(ReadLEB128<uint64_t>(data));
-    case DW_FORM_addr:
-    address_size:
-      switch (reader.unit_sizes().address_size()) {
-        case 4:
-          return AttrValue(ReadFixed<uint32_t>(data));
-        case 8:
-          return AttrValue(ReadFixed<uint64_t>(data));
-        default:
-          BLOATY_UNREACHABLE();
-      }
-    case DW_FORM_ref_addr:
-      if (reader.unit_sizes().dwarf_version() <= 2) {
-        goto address_size;
-      }
-      ABSL_FALLTHROUGH_INTENDED;
-    case DW_FORM_sec_offset:
-      if (reader.unit_sizes().dwarf64()) {
-        return AttrValue(ReadFixed<uint64_t>(data));
-      } else {
-        return AttrValue(ReadFixed<uint32_t>(data));
-      }
-    case DW_FORM_udata:
-      return AttrValue(ReadLEB128<uint64_t>(data));
-    case DW_FORM_block1:
-      return AttrValue(ReadBlock<uint8_t>(data));
-    case DW_FORM_block2:
-      return AttrValue(ReadBlock<uint16_t>(data));
-    case DW_FORM_block4:
-      return AttrValue(ReadBlock<uint32_t>(data));
-    case DW_FORM_block:
-    case DW_FORM_exprloc:
-      return AttrValue(ReadVariableBlock(data));
-    case DW_FORM_string:
-      return AttrValue(ReadNullTerminated(data));
-    case DW_FORM_strp:
-      if (reader.unit_sizes().dwarf64()) {
-        return AttrValue(ReadIndirectString<uint64_t>(reader, data));
-      } else {
-        return AttrValue(ReadIndirectString<uint32_t>(reader, data));
-      }
-    case DW_FORM_data1:
-      return AttrValue(ReadBytes(1, data));
-    case DW_FORM_data2:
-      return AttrValue(ReadBytes(2, data));
-    case DW_FORM_data4:
-      return AttrValue(ReadBytes(4, data));
-    case DW_FORM_data8:
-      return AttrValue(ReadBytes(8, data));
-    case DW_FORM_loclistx:
-    case DW_FORM_rnglistx:
-      return AttrValue(ReadLEB128<uint64_t>(data));
-
-    // Bloaty doesn't currently care about any bool or signed data.
-    // So we fudge it a bit and just stuff these in a uint64.
-    case DW_FORM_flag_present:
-      return AttrValue(1);
-    case DW_FORM_flag:
-      return AttrValue(ReadFixed<uint8_t>(data));
-    case DW_FORM_sdata:
-      return AttrValue(ReadLEB128<uint64_t>(data));
-    default:
-      THROWF("Don't know how to parse DWARF form: $0", form);
-  }
-}
-
-void DIEReader::SkipNullEntries() {
-  while (!remaining_.empty() && remaining_[0] == 0) {
-    // null entry terminates a chain of sibling entries.
-    remaining_.remove_prefix(1);
-    depth_--;
-  }
-}
-
-bool DIEReader::ReadCode() {
-  SkipNullEntries();
-  if (remaining_.empty()) {
-    state_ = State::kEof;
-    return false;
-  }
-  uint32_t code = ReadLEB128<uint32_t>(&remaining_);
-  if (!unit_abbrev_->GetAbbrev(code, &current_abbrev_)) {
-    THROW("couldn't find abbreviation for code");
-  }
-  state_ = State::kReadyToReadAttributes;
-  sibling_offset_ = 0;
-
-  if (HasChild()) {
-    depth_++;
-  }
-
-  return true;
-}
-
-bool DIEReader::NextCompilationUnit() {
-  return ReadCompilationUnitHeader();
-}
-
-bool DIEReader::NextDIE() {
-  if (state_ == State::kEof) {
-    return false;
-  }
-
-  assert(state_ == State::kReadyToNext);
-  return ReadCode();
-}
-
-bool DIEReader::SeekToCompilationUnit(Section section, uint64_t offset) {
-  section_ = section;
-
-  if (section == Section::kDebugInfo) {
-    next_unit_ = dwarf_.debug_info;
-  } else {
-    next_unit_ = dwarf_.debug_types;
-  }
-
-  start_ = next_unit_.data();
-  SkipBytes(offset, &next_unit_);
-  return ReadCompilationUnitHeader();
-}
-
-bool DIEReader::ReadCompilationUnitHeader() {
-  if (next_unit_.empty()) {
-    state_ = State::kEof;
-    return false;
-  }
-
-  unit_range_ = next_unit_;
-  remaining_ = unit_sizes_.ReadInitialLength(&next_unit_);
-  unit_range_ = unit_range_.substr(
-      0, remaining_.size() + (remaining_.data() - unit_range_.data()));
-
-  unit_sizes_.ReadDWARFVersion(&remaining_);
-
-  if (unit_sizes_.dwarf_version() > 5) {
-    THROWF("Data for $0 is in DWARF $1 format which we don't understand",
-        unit_name_, unit_sizes_.dwarf_version());
-  }
-
-  if (unit_sizes_.dwarf_version() == 5) {
-    unit_type_ = static_cast<UnitType>(ReadFixed<uint8_t>(&remaining_));
-    unit_sizes_.SetAddressSize(ReadFixed<uint8_t>(&remaining_));
-    debug_abbrev_offset_ = unit_sizes_.ReadDWARFOffset(&remaining_);
-    switch (unit_type_) {
-    case DW_UT_skeleton:
-    case DW_UT_split_compile:
-    case DW_UT_split_type:
-      dwo_id_ = ReadFixed<uint64_t>(&remaining_);
-      break;
-    case DW_UT_type:
-      unit_type_signature_ = ReadFixed<uint64_t>(&remaining_);
-      unit_type_offset_ = unit_sizes_.ReadDWARFOffset(&remaining_);
-      break;
-    case DW_UT_compile:
-    case DW_UT_partial:
-      break;
-#if defined(_GNUC)
-    case DW_UT_lo_user ... DW_UT_hi_user:
-#else
-    case DW_UT_lo_user:
-    case DW_UT_hi_user:
-#endif
-      // User defined unit types which we do not really know about ...
-      if (verbose_level > 0) {
-        fprintf(stderr, "Unknown DWARF Unit Type in user defined range\n");
-      }
-      break;
-    }
-  } else {
-    debug_abbrev_offset_ = unit_sizes_.ReadDWARFOffset(&remaining_);
-    unit_sizes_.SetAddressSize(ReadFixed<uint8_t>(&remaining_));
-
-    if (section_ == Section::kDebugTypes) {
-      unit_type_signature_ = ReadFixed<uint64_t>(&remaining_);
-      unit_type_offset_ = unit_sizes_.ReadDWARFOffset(&remaining_);
-    }
-  }
-
-  unit_abbrev_ = &abbrev_tables_[debug_abbrev_offset_];
-
-  // If we haven't already read abbreviations for this debug_abbrev_offset_, we
-  // need to do so now.
-  if (unit_abbrev_->IsEmpty()) {
-    string_view abbrev_data = dwarf_.debug_abbrev;
-    SkipBytes(debug_abbrev_offset_, &abbrev_data);
-    unit_abbrev_->ReadAbbrevs(abbrev_data);
-  }
-
-  auto abbrev_id = std::make_pair(unit_abbrev_, unit_sizes_);
-  auto insert_pair = abbrev_versions_.insert(
-      std::make_pair(abbrev_id, abbrev_versions_.size()));
-
-  // This will be either the newly inserted value or the existing one, if there
-  // was one.
-  abbrev_version_ = insert_pair.first->second;
-
-  return ReadCode();
-}
-
-bool DIEReader::SkipChildren() {
-  assert(state_ == State::kReadyToNext);
-  if (!HasChild()) {
-    return true;
-  }
-
-  int target_depth = depth_ - 1;
-  SkipNullEntries();
-  while (depth_ > target_depth) {
-    // TODO(haberman): use DW_AT_sibling to optimize skipping when it is
-    // available.
-    if (!NextDIE()) {
-      return false;
-    }
-    ReadAttributes([](uint16_t, dwarf::AttrValue) {});
-    SkipNullEntries();
-  }
-  return true;
-}
-
-// Reads all attributes for this DIE, storing the ones we were expecting.
-template <class T>
-void DIEReader::ReadAttributes(T&& func) {
-  assert(state_ == State::kReadyToReadAttributes);
-
-  for (auto attr : GetAbbrev().attr) {
-    AttrValue value = AttrValue::ParseAttr(*this, attr.form, &remaining_);
-    value.SetForm(attr.form);
-    func(attr.name, value);
-  }
-
-  if (remaining_.data() == nullptr) {
-    THROW("premature EOF reading DWARF attributes");
-  } else {
-    sibling_offset_ = 0;
-    state_ = State::kReadyToNext;
-  }
-}
-
 // RangeList ///////////////////////////////////////////////////////////////////
 
-void ReadRangeList(const DIEReader& die_reader, uint64_t low_pc,
-                   string_view name, RangeSink* sink, string_view* data) {
+void ReadRangeList(const CU& cu, uint64_t low_pc, string_view name,
+                   RangeSink* sink, string_view* data) {
   std::string name_str(name);
-  uint64_t max_address = die_reader.unit_sizes().GetMaxAddress();
+  uint64_t max_address = cu.unit_sizes().MaxAddress();
   while (true) {
     uint64_t start, end;
-    start = die_reader.unit_sizes().ReadAddress(data);
-    end = die_reader.unit_sizes().ReadAddress(data);
+    start = cu.unit_sizes().ReadAddress(data);
+    end = cu.unit_sizes().ReadAddress(data);
     if (start == 0 && end == 0) {
       return;
     } else if (start == max_address) {
@@ -1108,335 +193,6 @@
   }
 }
 
-// LineInfoReader //////////////////////////////////////////////////////////////
-
-// Code to read the .line_info programs in a DWARF file.
-
-class LineInfoReader {
- public:
-  LineInfoReader(const File& file) : file_(file), info_(0) {}
-
-  struct LineInfo {
-    LineInfo(bool default_is_stmt) : is_stmt(default_is_stmt) {}
-    uint64_t address = 0;
-    uint32_t file = 1;
-    uint32_t line = 1;
-    uint32_t column = 0;
-    uint32_t discriminator = 0;
-    bool end_sequence = false;
-    bool basic_block = false;
-    bool prologue_end = false;
-    bool epilogue_begin = false;
-    bool is_stmt;
-    uint8_t op_index = 0;
-    uint8_t isa = 0;
-  };
-
-  struct FileName {
-    string_view name;
-    uint32_t directory_index;
-    uint64_t modified_time;
-    uint64_t file_size;
-  };
-
-  void SeekToOffset(uint64_t offset, uint8_t address_size);
-  bool ReadLineInfo();
-  const LineInfo& lineinfo() const { return info_; }
-  const FileName& filename(size_t i) const { return filenames_[i]; }
-  string_view include_directory(size_t i) const {
-    return include_directories_[i];
-  }
-
-  const std::string& GetExpandedFilename(size_t index) {
-    if (index >= filenames_.size()) {
-      THROW("filename index out of range");
-    }
-
-    // Generate these lazily.
-    if (expanded_filenames_.size() <= index) {
-      expanded_filenames_.resize(filenames_.size());
-    }
-
-    std::string& ret = expanded_filenames_[index];
-    if (ret.empty()) {
-      const FileName& filename = filenames_[index];
-      string_view directory = include_directories_[filename.directory_index];
-      ret = std::string(directory);
-      if (!ret.empty()) {
-        ret += "/";
-      }
-      ret += std::string(filename.name);
-    }
-    return ret;
-  }
-
- private:
-  struct Params {
-    uint8_t minimum_instruction_length;
-    uint8_t maximum_operations_per_instruction;
-    uint8_t default_is_stmt;
-    int8_t line_base;
-    uint8_t line_range;
-    uint8_t opcode_base;
-  } params_;
-
-  const File& file_;
-
-  CompilationUnitSizes sizes_;
-  std::vector<string_view> include_directories_;
-  std::vector<FileName> filenames_;
-  std::vector<uint8_t> standard_opcode_lengths_;
-  std::vector<std::string> expanded_filenames_;
-
-  string_view remaining_;
-
-  // Whether we are in a "shadow" part of the bytecode program.  Sometimes
-  // parts of the line info program make it into the final binary even though
-  // the corresponding code was stripped.  We can tell when this happened by
-  // looking for DW_LNE_set_address ops where the operand is 0.  This
-  // indicates that a relocation for that argument never got applied, which
-  // probably means that the code got stripped.
-  //
-  // While this is true, we don't yield any LineInfo entries, because the
-  // "address" value is garbage.
-  bool shadow_;
-
-  LineInfo info_;
-
-  void DoAdvance(uint64_t advance, uint8_t max_per_instr) {
-    info_.address += params_.minimum_instruction_length *
-                     ((info_.op_index + advance) / max_per_instr);
-    info_.op_index = (info_.op_index + advance) % max_per_instr;
-  }
-
-  void Advance(uint64_t amount) {
-    if (params_.maximum_operations_per_instruction == 1) {
-      // This is by far the common case (only false on VLIW architectuers),
-      // and this inlining/specialization avoids a costly division.
-      DoAdvance(amount, 1);
-    } else {
-      DoAdvance(amount, params_.maximum_operations_per_instruction);
-    }
-  }
-
-  uint8_t AdjustedOpcode(uint8_t op) { return op - params_.opcode_base; }
-
-  void SpecialOpcodeAdvance(uint8_t op) {
-    Advance(AdjustedOpcode(op) / params_.line_range);
-  }
-};
-
-void LineInfoReader::SeekToOffset(uint64_t offset, uint8_t address_size) {
-  string_view data = file_.debug_line;
-  SkipBytes(offset, &data);
-
-  sizes_.SetAddressSize(address_size);
-  data = sizes_.ReadInitialLength(&data);
-  sizes_.ReadDWARFVersion(&data);
-  uint64_t header_length = sizes_.ReadDWARFOffset(&data);
-  string_view program = data;
-  SkipBytes(header_length, &program);
-
-  params_.minimum_instruction_length = ReadFixed<uint8_t>(&data);
-  if (sizes_.dwarf_version() == 4) {
-    params_.maximum_operations_per_instruction = ReadFixed<uint8_t>(&data);
-
-    if (params_.maximum_operations_per_instruction == 0) {
-      THROW("DWARF line info had maximum_operations_per_instruction=0");
-    }
-  } else {
-    params_.maximum_operations_per_instruction = 1;
-  }
-  params_.default_is_stmt = ReadFixed<uint8_t>(&data);
-  params_.line_base = ReadFixed<int8_t>(&data);
-  params_.line_range = ReadFixed<uint8_t>(&data);
-  params_.opcode_base = ReadFixed<uint8_t>(&data);
-  if (params_.line_range == 0) {
-    THROW("line_range of zero will cause divide by zero");
-  }
-
-  standard_opcode_lengths_.resize(params_.opcode_base);
-  for (size_t i = 1; i < params_.opcode_base; i++) {
-    standard_opcode_lengths_[i] = ReadFixed<uint8_t>(&data);
-  }
-
-  // Read include_directories.
-  include_directories_.clear();
-
-  // Implicit current directory entry.
-  include_directories_.push_back(string_view());
-
-  while (true) {
-    string_view dir = ReadNullTerminated(&data);
-    if (dir.empty()) {
-      break;
-    }
-    include_directories_.push_back(dir);
-  }
-
-  // Read file_names.
-  filenames_.clear();
-  expanded_filenames_.clear();
-
-  // Filename 0 is unused.
-  filenames_.push_back(FileName());
-  while (true) {
-    FileName file_name;
-    file_name.name = ReadNullTerminated(&data);
-    if (file_name.name.empty()) {
-      break;
-    }
-    file_name.directory_index = ReadLEB128<uint32_t>(&data);
-    file_name.modified_time = ReadLEB128<uint64_t>(&data);
-    file_name.file_size = ReadLEB128<uint64_t>(&data);
-    if (file_name.directory_index >= include_directories_.size()) {
-      THROW("directory index out of range");
-    }
-    filenames_.push_back(file_name);
-  }
-
-  info_ = LineInfo(params_.default_is_stmt);
-  remaining_ = program;
-  shadow_ = false;
-}
-
-bool LineInfoReader::ReadLineInfo() {
-  // Final step of last DW_LNS_copy / special opcode.
-  info_.discriminator = 0;
-  info_.basic_block = false;
-  info_.prologue_end = false;
-  info_.epilogue_begin = false;
-
-  // Final step of DW_LNE_end_sequence.
-  info_.end_sequence = false;
-
-  string_view data = remaining_;
-
-  while (true) {
-    if (data.empty()) {
-      remaining_ = data;
-      return false;
-    }
-
-    uint8_t op = ReadFixed<uint8_t>(&data);
-
-    if (op >= params_.opcode_base) {
-      SpecialOpcodeAdvance(op);
-      info_.line +=
-          params_.line_base + (AdjustedOpcode(op) % params_.line_range);
-      if (!shadow_) {
-        remaining_ = data;
-        return true;
-      }
-    } else {
-      switch (op) {
-        case DW_LNS_extended_op: {
-          uint16_t len = ReadLEB128<uint16_t>(&data);
-          uint8_t extended_op = ReadFixed<uint8_t>(&data);
-          switch (extended_op) {
-            case DW_LNE_end_sequence: {
-              // Preserve address and set end_sequence, but reset everything
-              // else.
-              uint64_t addr = info_.address;
-              info_ = LineInfo(params_.default_is_stmt);
-              info_.address = addr;
-              info_.end_sequence = true;
-              if (!shadow_) {
-                remaining_ = data;
-                return true;
-              }
-              break;
-            }
-            case DW_LNE_set_address:
-              info_.address = sizes_.ReadAddress(&data);
-              info_.op_index = 0;
-              shadow_ = (info_.address == 0);
-              break;
-            case DW_LNE_define_file: {
-              FileName file_name;
-              file_name.name = ReadNullTerminated(&data);
-              file_name.directory_index = ReadLEB128<uint32_t>(&data);
-              file_name.modified_time = ReadLEB128<uint64_t>(&data);
-              file_name.file_size = ReadLEB128<uint64_t>(&data);
-              if (file_name.directory_index >= include_directories_.size()) {
-                THROW("directory index out of range");
-              }
-              filenames_.push_back(file_name);
-              break;
-            }
-            case DW_LNE_set_discriminator:
-              info_.discriminator = ReadLEB128<uint32_t>(&data);
-              break;
-            default:
-              // We don't understand this opcode, skip it.
-              SkipBytes(len, &data);
-              if (verbose_level > 0) {
-                fprintf(stderr,
-                        "bloaty: warning: unknown DWARF line table extended "
-                        "opcode: %d\n",
-                        extended_op);
-              }
-              break;
-          }
-          break;
-        }
-        case DW_LNS_copy:
-          if (!shadow_) {
-            remaining_ = data;
-            return true;
-          }
-          break;
-        case DW_LNS_advance_pc:
-          Advance(ReadLEB128<uint64_t>(&data));
-          break;
-        case DW_LNS_advance_line:
-          info_.line += ReadLEB128<int32_t>(&data);
-          break;
-        case DW_LNS_set_file:
-          info_.file = ReadLEB128<uint32_t>(&data);
-          if (info_.file >= filenames_.size()) {
-            THROW("filename index too big");
-          }
-          break;
-        case DW_LNS_set_column:
-          info_.column = ReadLEB128<uint32_t>(&data);
-          break;
-        case DW_LNS_negate_stmt:
-          info_.is_stmt = !info_.is_stmt;
-          break;
-        case DW_LNS_set_basic_block:
-          info_.basic_block = true;
-          break;
-        case DW_LNS_const_add_pc:
-          SpecialOpcodeAdvance(255);
-          break;
-        case DW_LNS_fixed_advance_pc:
-          info_.address += ReadFixed<uint16_t>(&data);
-          info_.op_index = 0;
-          break;
-        case DW_LNS_set_prologue_end:
-          info_.prologue_end = true;
-          break;
-        case DW_LNS_set_epilogue_begin:
-          info_.epilogue_begin = true;
-          break;
-        case DW_LNS_set_isa:
-          info_.isa = ReadLEB128<uint8_t>(&data);
-          break;
-        default:
-          // Unknown opcode, but we know its length so can skip it.
-          SkipBytes(standard_opcode_lengths_[op], &data);
-          if (verbose_level > 0) {
-            fprintf(stderr,
-                    "bloaty: warning: unknown DWARF line table opcode: %d\n",
-                    op);
-          }
-          break;
-      }
-    }
-  }
-}
-
 string_view* File::GetFieldByName(string_view name) {
   if (name == "aranges") {
     return &debug_aranges;
@@ -1484,7 +240,7 @@
   class FilenameMap {
    public:
     FilenameMap(const dwarf::File& file)
-        : die_reader_(file),
+        : info_reader_(file),
           missing_("[DWARF is missing filename]") {}
 
     std::string GetFilename(uint64_t compilation_unit_offset) {
@@ -1496,39 +252,27 @@
     }
 
    private:
-    bool ReadName(string_view* name, uint64_t offset) {
-      auto sec = dwarf::DIEReader::Section::kDebugInfo;
-      if (!die_reader_.SeekToCompilationUnit(sec, offset) ||
-          die_reader_.GetTag() != DW_TAG_compile_unit) {
+    bool ReadName(std::string* name, uint64_t offset) {
+      auto sec = dwarf::InfoReader::Section::kDebugInfo;
+      dwarf::CUIter iter = info_reader_.GetCUIter(sec, offset);
+      dwarf::CU cu;
+      if (!iter.NextCU(info_reader_, &cu)) {
           return false;
       }
-
-      absl::optional<dwarf::AttrValue> attr;
-
-      die_reader_.ReadAttributes([&attr](uint16_t tag, dwarf::AttrValue data) {
-        if (tag == DW_AT_name && data.IsString()) {
-          attr = data;
-        }
-      });
-      
-      if (attr && attr->IsString()) {
-        *name = attr->GetString(die_reader_);
-        return true;
-      } else {
-        return false;
-      }
+      *name = cu.unit_name();
+      return true;
     }
 
     std::string LookupFilename(uint64_t compilation_unit_offset) {
-      string_view name;
+      std::string name;
       if (ReadName(&name, compilation_unit_offset)) {
-        return std::string(name);
+        return name;
       } else {
         return missing_;
       }
     }
 
-    dwarf::DIEReader die_reader_;
+    dwarf::InfoReader info_reader_;
     std::unordered_map<uint64_t, std::string> map_;
     std::string missing_;
   } map(file);
@@ -1543,6 +287,7 @@
         sink->AddVMRangeIgnoreDuplicate("dwarf_aranges", ranges.address(),
                                         ranges.length(), filename);
       }
+      sink->AddFileRange("dwarf_aranges_data", filename, ranges.data());
     }
   }
 
@@ -1550,134 +295,129 @@
 }
 
 struct GeneralDIE {
-  absl::optional<dwarf::AttrValue> name;
-  absl::optional<dwarf::AttrValue> linkage_name;
-  absl::optional<dwarf::AttrValue> declaration;
-  absl::optional<dwarf::AttrValue> location;
-  absl::optional<dwarf::AttrValue> low_pc;
-  absl::optional<dwarf::AttrValue> high_pc;
-  absl::optional<dwarf::AttrValue> stmt_list;
-  absl::optional<dwarf::AttrValue> ranges;
-  absl::optional<dwarf::AttrValue> start_scope;
+  absl::optional<string_view> name;
+  absl::optional<string_view> location_string;
+  absl::optional<uint64_t> location_uint64;
+  absl::optional<uint64_t> low_pc;
+  absl::optional<uint64_t> high_pc_addr;
+  absl::optional<uint64_t> high_pc_size;
+  absl::optional<uint64_t> stmt_list;
+  absl::optional<uint64_t> rnglistx;
+  absl::optional<uint64_t> ranges;
+  absl::optional<uint64_t> start_scope;
+  bool declaration = false;
 };
 
-void ReadGeneralDIEAttr(uint16_t tag, dwarf::AttrValue val, GeneralDIE *die) {
+void ReadGeneralDIEAttr(uint16_t tag, dwarf::AttrValue val, const dwarf::CU& cu,
+                        GeneralDIE* die) {
   switch (tag) {
     case DW_AT_name:
-      die->name = val;
-      break;
-    case DW_AT_linkage_name:
-      die->linkage_name = val;
+      if (val.IsString()) {
+        die->name = val.GetString(cu);
+      }
       break;
     case DW_AT_declaration:
-      die->declaration = val;
+      if (auto uint = val.ToUint(cu)) {
+        die->declaration = *uint;
+      }
       break;
     case DW_AT_location:
-      die->location = val;
+      if (val.IsString()) {
+        die->location_string = val.GetString(cu);
+      } else if (val.form() == DW_FORM_sec_offset) {
+        die->location_uint64 = val.GetUint(cu);
+      }
       break;
     case DW_AT_low_pc:
-      die->low_pc = val;
+      if (auto uint = val.ToUint(cu)) {
+        die->low_pc = *uint;
+      }
       break;
     case DW_AT_high_pc:
-      die->high_pc = val;
+      switch (val.form()) {
+        case DW_FORM_addr:
+        case DW_FORM_addrx:
+        case DW_FORM_addrx1:
+        case DW_FORM_addrx2:
+        case DW_FORM_addrx3:
+        case DW_FORM_addrx4:
+          // high_pc is absolute.
+          die->high_pc_addr = val.GetUint(cu);
+          break;
+        case DW_FORM_data1:
+        case DW_FORM_data2:
+        case DW_FORM_data4:
+        case DW_FORM_data8:
+          // high_pc is a size.
+          die->high_pc_size = val.ToUint(cu);
+          break;
+        default:
+          if (verbose_level > 0) {
+            fprintf(stderr, "Unexpected form for high_pc: %d\n", val.form());
+          }
+          break;
+      }
       break;
     case DW_AT_stmt_list:
-      die->stmt_list = val;
+      if (auto uint = val.ToUint(cu)) {
+        die->stmt_list = *uint;
+      }
       break;
     case DW_AT_ranges:
-      die->ranges = val;
+      if (auto uint = val.ToUint(cu)) {
+        if (val.form() == DW_FORM_rnglistx) {
+          die->rnglistx = *uint;
+        } else {
+          die->ranges = *uint;
+        }
+      }
       break;
     case DW_AT_start_scope:
-      die->start_scope = val;
+      if (auto uint = val.ToUint(cu)) {
+        die->start_scope = *uint;
+      }
       break;
   }
 }
 
-class InlinesDIE {
- public:
-  bool has_stmt_list() const { return has_stmt_list_; }
-
-  uint64_t stmt_list() const { return stmt_list_; }
-
-  void set_stmt_list(uint64_t val) {
-    has_stmt_list_ = true;
-    stmt_list_ = val;
-  }
-
- private:
-  bool has_stmt_list_ = false;
-  uint64_t stmt_list_ = 0;
-};
-
-uint64_t TryReadPcPair(const std::string& name, const GeneralDIE& die,
-                       const dwarf::DIEReader& die_reader, RangeSink* sink) {
-  if (!die.low_pc || !die.high_pc || !die.low_pc->IsUint()) return 0;
-
-  uint64_t low_pc = die.low_pc->GetUint(die_reader);
-  uint8_t address_size = die_reader.unit_sizes().address_size();
-  if (!dwarf::IsValidDwarfAddress(low_pc, address_size)) return 0;
-
+uint64_t TryReadPcPair(const dwarf::CU& cu, const GeneralDIE& die,
+                       RangeSink* sink) {
+  uint64_t addr;
   uint64_t size;
 
-  switch (die.high_pc->form()) {
-    case DW_FORM_addr:
-    case DW_FORM_addrx:
-    case DW_FORM_addrx1:
-    case DW_FORM_addrx2:
-    case DW_FORM_addrx3:
-    case DW_FORM_addrx4:
-      // high_pc is absolute.
-      size = die.high_pc->GetUint(die_reader) - low_pc;
-      break;
-    case DW_FORM_data1:
-    case DW_FORM_data2:
-    case DW_FORM_data4:
-    case DW_FORM_data8:
-      // high_pc is a size.
-      size = *die.high_pc->ToUint(die_reader);
-      break;
-    default:
-      if (verbose_level > 0) {
-        fprintf(stderr, "Unexpected form for high_pc: %d\n", die.high_pc->form());
-      }
-      return 0;
+  if (!die.low_pc) return 0;
+  addr = *die.low_pc;
+
+  if (die.high_pc_addr) {
+    size = *die.high_pc_addr - addr;
+  } else if (die.high_pc_size) {
+    size = *die.high_pc_size;
+  } else{
+    return 0;
   }
 
-  sink->AddVMRangeIgnoreDuplicate("dwarf_pcpair", low_pc, size, name);
-  return low_pc;
+  sink->AddVMRangeIgnoreDuplicate("dwarf_pcpair", addr, size, cu.unit_name());
+  return addr;
 }
 
 // To view DIEs for a given file, try:
 //   readelf --debug-dump=info foo.bin
-void AddDIE(const dwarf::File& file, const std::string& name,
-            const GeneralDIE& die, const SymbolTable& symtab,
-            const DualMap& symbol_map, const dwarf::DIEReader& die_reader,
-            RangeSink* sink) {
-  uint64_t low_pc = TryReadPcPair(name, die, die_reader, sink);
-
-  // Sometimes a DIE has a linkage_name, which we can look up in the symbol
-  // table.
-  if (die.linkage_name && die.linkage_name->IsString()) {
-    auto linkage_name = die.linkage_name->GetString(die_reader);
-    auto it = symtab.find(linkage_name);
-    if (it != symtab.end()) {
-      sink->AddVMRangeIgnoreDuplicate("dwarf_linkagename", it->second.first,
-                                      it->second.second, name);
-    }
-  }
+void AddDIE(const dwarf::CU& cu, const GeneralDIE& die,
+            const DualMap& symbol_map, RangeSink* sink) {
+  uint64_t low_pc = TryReadPcPair(cu, die, sink);
 
   // Sometimes the DIE has a "location", which gives the location as an address.
   // This parses a very small subset of the overall DWARF expression grammar.
-  if (die.location && die.location->IsString()) {
-    string_view location = die.location->GetString(die_reader);
-    if (location.size() == die_reader.unit_sizes().address_size() + 1 &&
+  if (die.location_string) {
+    string_view location = *die.location_string;
+    if (location.size() == cu.unit_sizes().address_size() + 1 &&
         location[0] == DW_OP_addr) {
       location.remove_prefix(1);
       uint64_t addr;
       // TODO(haberman): endian?
-      if (die_reader.unit_sizes().address_size() == 4) {
+      if (cu.unit_sizes().address_size() == 4) {
         addr = ReadFixed<uint32_t>(&location);
-      } else if (die_reader.unit_sizes().address_size() == 8) {
+      } else if (cu.unit_sizes().address_size() == 8) {
         addr = ReadFixed<uint64_t>(&location);
       } else {
         BLOATY_UNREACHABLE();
@@ -1687,82 +427,79 @@
       // up in the symbol map.
       uint64_t size;
       if (symbol_map.vm_map.TryGetSize(addr, &size)) {
-        sink->AddVMRangeIgnoreDuplicate("dwarf_location", addr, size, name);
+        sink->AddVMRangeIgnoreDuplicate("dwarf_location", addr, size,
+                                        cu.unit_name());
       } else {
         if (verbose_level > 0) {
           fprintf(stderr,
                   "bloaty: warning: couldn't find DWARF location in symbol "
                   "table, address: %" PRIx64 ", name: %s\n",
-                  addr, name.c_str());
+                  addr, cu.unit_name().c_str());
         }
       }
     }
   }
 
   // Sometimes a location is given as an offset into debug_loc.
-  if (die.location && die.location->IsUint()) {
-    uint64_t location = die.location->GetUint(die_reader);
-    if (die.location->form() == DW_FORM_sec_offset) {
-      if (location < file.debug_loc.size()) {
-        absl::string_view loc_range = file.debug_loc.substr(location);
-        loc_range = GetLocationListRange(die_reader.unit_sizes(), loc_range);
-        sink->AddFileRange("dwarf_locrange", name, loc_range);
-      } else if (verbose_level > 0) {
-        fprintf(
-            stderr,
-            "bloaty: warning: DWARF location out of range, location=%" PRIx64
-            "\n",
-            location);
-      }
+  if (die.location_uint64) {
+    uint64_t location = *die.location_uint64;;
+    if (location < cu.dwarf().debug_loc.size()) {
+      absl::string_view loc_range = cu.dwarf().debug_loc.substr(location);
+      loc_range = GetLocationListRange(cu.unit_sizes(), loc_range);
+      sink->AddFileRange("dwarf_locrange", cu.unit_name(), loc_range);
+    } else if (verbose_level > 0) {
+      fprintf(stderr,
+              "bloaty: warning: DWARF location out of range, location=%" PRIx64
+              "\n",
+              location);
     }
   }
 
   // DWARF 5 range list is the same information as "ranges" but in a different
   // format.
-  if (die.ranges && die.ranges->form() == DW_FORM_rnglistx && die.ranges->IsUint()) {
-    uint64_t range_list = die.ranges->GetUint(die_reader);
-    const dwarf::CompilationUnitSizes& sizes = die_reader.unit_sizes();
-    size_t offset_size = die_reader.unit_sizes().dwarf64() ? 8 : 4;
-    string_view offset_data = StrictSubstr(
-        file.debug_rnglists, die_reader.unit_sizes().range_lists_base() +
-                                 (range_list * offset_size));
-    uint64_t offset = die_reader.unit_sizes().ReadDWARFOffset(&offset_data);
+  if (die.rnglistx) {
+    uint64_t range_list = *die.rnglistx;
+    size_t offset_size = cu.unit_sizes().dwarf64() ? 8 : 4;
+    string_view offset_data =
+        StrictSubstr(cu.dwarf().debug_rnglists,
+                     cu.range_lists_base() + (range_list * offset_size));
+    uint64_t offset = cu.unit_sizes().ReadDWARFOffset(&offset_data);
     string_view data = StrictSubstr(
-        file.debug_rnglists, die_reader.unit_sizes().range_lists_base() + offset);
+        cu.dwarf().debug_rnglists, cu.range_lists_base() + offset);
     const char* start = data.data();
     bool done = false;
-    uint64_t base_address = sizes.addr_base();
+    uint64_t base_address = cu.addr_base();
     while (!done) {
       switch (ReadFixed<uint8_t>(&data)) {
         case DW_RLE_end_of_list:
           done = true;
           break;
         case DW_RLE_base_addressx:
-          base_address = ReadIndirectAddress(
-              die_reader, dwarf::ReadLEB128<uint64_t>(&data));
+          base_address =
+              ReadIndirectAddress(cu, dwarf::ReadLEB128<uint64_t>(&data));
           break;
         case DW_RLE_startx_endx: {
-          uint64_t start = ReadIndirectAddress(
-              die_reader, dwarf::ReadLEB128<uint64_t>(&data));
-          uint64_t end = ReadIndirectAddress(
-              die_reader, dwarf::ReadLEB128<uint64_t>(&data));
+          uint64_t start =
+              ReadIndirectAddress(cu, dwarf::ReadLEB128<uint64_t>(&data));
+          uint64_t end =
+              ReadIndirectAddress(cu, dwarf::ReadLEB128<uint64_t>(&data));
           sink->AddVMRangeIgnoreDuplicate("dwarf_rangelst", start, end - start,
-                                          name);
+                                          cu.unit_name());
           break;
         }
         case DW_RLE_startx_length: {
-          uint64_t start = ReadIndirectAddress(
-              die_reader, dwarf::ReadLEB128<uint64_t>(&data));
+          uint64_t start =
+              ReadIndirectAddress(cu, dwarf::ReadLEB128<uint64_t>(&data));
           uint64_t length = dwarf::ReadLEB128<uint64_t>(&data);
           sink->AddVMRangeIgnoreDuplicate("dwarf_rangelst", start, length,
-                                          name);
+                                          cu.unit_name());
           break;
         }
         case DW_RLE_offset_pair: {
           uint64_t start = dwarf::ReadLEB128<uint64_t>(&data) + base_address;
           uint64_t end = dwarf::ReadLEB128<uint64_t>(&data) + base_address;
           sink->AddVMRangeIgnoreDuplicate("dwarf_rangelst", start, end - start,
-                                          name);
+                                          cu.unit_name());
           break;
         }
         case DW_RLE_base_address:
@@ -1773,25 +510,25 @@
       }
     }
     string_view all(start, data.data() - start);
-    sink->AddFileRange("dwarf_rangelst_addrs", name, all);
+    sink->AddFileRange("dwarf_rangelst_addrs", cu.unit_name(), all);
   } else {
     uint64_t ranges_offset = UINT64_MAX;
 
     // There are two different attributes that sometimes contain an offset into
     // debug_ranges.
-    if (die.ranges && die.ranges->IsUint()) {
-      ranges_offset = die.ranges->GetUint(die_reader);
-    } else if (die.start_scope && die.start_scope->IsUint()) {
-      ranges_offset = die.start_scope->GetUint(die_reader);
+    if (die.ranges) {
+      ranges_offset = *die.ranges;
+    } else if (die.start_scope) {
+      ranges_offset = *die.start_scope;
     }
 
     if (ranges_offset != UINT64_MAX) {
-      if (ranges_offset < file.debug_ranges.size()) {
-        absl::string_view data = file.debug_ranges.substr(ranges_offset);
+      if (ranges_offset < cu.dwarf().debug_ranges.size()) {
+        absl::string_view data = cu.dwarf().debug_ranges.substr(ranges_offset);
         const char* start = data.data();
-        ReadRangeList(die_reader, low_pc, name, sink, &data);
+        ReadRangeList(cu, low_pc, cu.unit_name(), sink, &data);
         string_view all(start, data.data() - start);
-        sink->AddFileRange("dwarf_debugrange", name, all);
+        sink->AddFileRange("dwarf_debugrange", cu.unit_name(), all);
       } else if (verbose_level > 0) {
         fprintf(stderr,
                 "bloaty: warning: DWARF debug range out of range, "
@@ -1802,9 +539,8 @@
   }
 }
 
-static void ReadDWARFPubNames(const dwarf::File& file, string_view section,
+static void ReadDWARFPubNames(dwarf::InfoReader& reader, string_view section,
                               RangeSink* sink) {
-  dwarf::DIEReader die_reader(file);
   string_view remaining = section;
 
   while (remaining.size() > 0) {
@@ -1815,377 +551,84 @@
         full_unit.substr(0, unit.size() + (unit.data() - full_unit.data()));
     sizes.ReadDWARFVersion(&unit);
     uint64_t debug_info_offset = sizes.ReadDWARFOffset(&unit);
-    bool ok = die_reader.SeekToCompilationUnit(
-        dwarf::DIEReader::Section::kDebugInfo, debug_info_offset);
-    if (!ok) {
-      THROW("Couldn't seek to debug_info section");
-    }
-    string_view compileunit_name;
-    die_reader.ReadAttributes(
-        [&compileunit_name, &die_reader](uint16_t tag, dwarf::AttrValue data) {
-          if (tag == DW_AT_name && data.IsString()) {
-            compileunit_name = data.GetString(die_reader);
-          }
-        });
-    if (!compileunit_name.empty()) {
-      sink->AddFileRange("dwarf_pubnames", compileunit_name, full_unit);
+
+    dwarf::CUIter iter = reader.GetCUIter(
+        dwarf::InfoReader::Section::kDebugInfo, debug_info_offset);
+    dwarf::CU cu;
+    if (iter.NextCU(reader, &cu) && !cu.unit_name().empty()) {
+      sink->AddFileRange("dwarf_pubnames", cu.unit_name(), full_unit);
     }
   }
 }
 
-uint64_t ReadEncodedPointer(uint8_t encoding, bool is_64bit, string_view* data,
-                            const char* data_base, RangeSink* sink) {
-  uint64_t value;
-  const char* ptr = data->data();
-  uint8_t format = encoding & DW_EH_PE_FORMAT_MASK;
-
-  switch (format) {
-    case DW_EH_PE_omit:
-      return 0;
-    case DW_EH_PE_absptr:
-      if (is_64bit) {
-        value = ReadFixed<uint64_t>(data);
-      } else {
-        value = ReadFixed<uint32_t>(data);
-      }
-      break;
-    case DW_EH_PE_uleb128:
-      value = dwarf::ReadLEB128<uint64_t>(data);
-      break;
-    case DW_EH_PE_udata2:
-      value = ReadFixed<uint16_t>(data);
-      break;
-    case DW_EH_PE_udata4:
-      value = ReadFixed<uint32_t>(data);
-      break;
-    case DW_EH_PE_udata8:
-      value = ReadFixed<uint64_t>(data);
-      break;
-    case DW_EH_PE_sleb128:
-      value = dwarf::ReadLEB128<int64_t>(data);
-      break;
-    case DW_EH_PE_sdata2:
-      value = ReadFixed<int16_t>(data);
-      break;
-    case DW_EH_PE_sdata4:
-      value = ReadFixed<int32_t>(data);
-      break;
-    case DW_EH_PE_sdata8:
-      value = ReadFixed<int64_t>(data);
-      break;
-    default:
-      THROWF("Unexpected eh_frame format value: $0", format);
-  }
-
-  uint8_t application = encoding & DW_EH_PE_APPLICATION_MASK;
-
-  switch (application) {
-    case 0:
-      break;
-    case DW_EH_PE_pcrel:
-      value += sink->TranslateFileToVM(ptr);
-      break;
-    case DW_EH_PE_datarel:
-      if (data_base == nullptr) {
-        THROW("datarel requested but no data_base provided");
-      }
-      value += sink->TranslateFileToVM(data_base);
-      break;
-    case DW_EH_PE_textrel:
-    case DW_EH_PE_funcrel:
-    case DW_EH_PE_aligned:
-      THROWF("Unimplemented eh_frame application value: $0", application);
-  }
-
-  if (encoding & DW_EH_PE_indirect) {
-    string_view location = sink->TranslateVMToFile(value);
-    if (is_64bit) {
-      value = ReadFixed<uint64_t>(&location);
-    } else {
-      value = ReadFixed<uint32_t>(&location);
-    }
-  }
-
-  return value;
-}
-
-// Code to read the .eh_frame section.  This is not technically DWARF, but it
-// is similar to .debug_frame (which is DWARF) so it's convenient to put it
-// here.
-//
-// The best documentation I can find for this format comes from:
-//
-// *
-// http://refspecs.linuxfoundation.org/LSB_5.0.0/LSB-Core-generic/LSB-Core-generic/ehframechpt.html
-// * https://www.airs.com/blog/archives/460
-//
-// However these are both under-specified.  Some details are not mentioned in
-// either of these (for example, the fact that the function length uses the FDE
-// encoding, but always absolute).  libdwarf's implementation contains a comment
-// saying "It is not clear if this is entirely correct".  Basically the only
-// thing you can trust for some of these details is the code that actually
-// implements unwinding in production:
-//
-// * libunwind http://www.nongnu.org/libunwind/
-//   https://github.com/pathscale/libunwind/blob/master/src/dwarf/Gfde.c
-// * LLVM libunwind (a different project!!)
-//   https://github.com/llvm-mirror/libunwind/blob/master/src/DwarfParser.hpp
-// * libgcc
-//   https://github.com/gcc-mirror/gcc/blob/master/libgcc/unwind-dw2-fde.c
-void ReadEhFrame(string_view data, RangeSink* sink) {
-  string_view remaining = data;
-
-  struct CIEInfo {
-    int version = 0;
-    uint32_t code_align = 0;
-    int32_t data_align = 0;
-    uint8_t fde_encoding = 0;
-    uint8_t lsda_encoding = 0;
-    bool is_signal_handler = false;
-    bool has_augmentation_length = false;
-    uint64_t personality_function = 0;
-    uint32_t return_address_reg = 0;
-  };
-
-  std::unordered_map<const void*, CIEInfo> cie_map;
-
-  while (remaining.size() > 0) {
-    dwarf::CompilationUnitSizes sizes;
-    string_view full_entry = remaining;
-    string_view entry = sizes.ReadInitialLength(&remaining);
-    if (entry.size() == 0 && remaining.size() == 0) {
-      return;
-    }
-    full_entry =
-        full_entry.substr(0, entry.size() + (entry.data() - full_entry.data()));
-    uint32_t id = ReadFixed<uint32_t>(&entry);
-    if (id == 0) {
-      // CIE, we don't attribute this yet.
-      CIEInfo& cie_info = cie_map[full_entry.data()];
-      cie_info.version = ReadFixed<uint8_t>(&entry);
-      string_view aug_string = ReadNullTerminated(&entry);
-      cie_info.code_align = dwarf::ReadLEB128<uint32_t>(&entry);
-      cie_info.data_align = dwarf::ReadLEB128<int32_t>(&entry);
-      switch (cie_info.version) {
-        case 1:
-          cie_info.return_address_reg = ReadFixed<uint8_t>(&entry);
-          break;
-        case 3:
-          cie_info.return_address_reg = dwarf::ReadLEB128<uint32_t>(&entry);
-          break;
-        default:
-          THROW("Unexpected eh_frame CIE version");
-      }
-      while (aug_string.size() > 0) {
-        switch (aug_string[0]) {
-          case 'z':
-            // Length until the end of augmentation data.
-            cie_info.has_augmentation_length = true;
-            dwarf::ReadLEB128<uint32_t>(&entry);
-            break;
-          case 'L':
-            cie_info.lsda_encoding = ReadFixed<uint8_t>(&entry);
-            break;
-          case 'R':
-            cie_info.fde_encoding = ReadFixed<uint8_t>(&entry);
-            break;
-          case 'S':
-            cie_info.is_signal_handler = true;
-            break;
-          case 'P': {
-            uint8_t encoding = ReadFixed<uint8_t>(&entry);
-            cie_info.personality_function =
-                ReadEncodedPointer(encoding, true, &entry, nullptr, sink);
-            break;
-          }
-          default:
-            THROW("Unexepcted augmentation character");
-        }
-        aug_string.remove_prefix(1);
-      }
-    } else {
-      auto iter = cie_map.find(entry.data() - id - 4);
-      if (iter == cie_map.end()) {
-        THROW("Couldn't find CIE for FDE");
-      }
-      const CIEInfo& cie_info = iter->second;
-      // TODO(haberman): don't hard-code 64-bit.
-      uint64_t address = ReadEncodedPointer(cie_info.fde_encoding, true, &entry,
-                                            nullptr, sink);
-      // TODO(haberman); Technically the FDE addresses could span a
-      // function/compilation unit?  They can certainly span inlines.
-      /*
-      uint64_t length =
-        ReadEncodedPointer(cie_info.fde_encoding & 0xf, true, &entry, sink);
-      (void)length;
-
-      if (cie_info.has_augmentation_length) {
-        uint32_t augmentation_length = dwarf::ReadLEB128<uint32_t>(&entry);
-        (void)augmentation_length;
-      }
-
-      uint64_t lsda =
-          ReadEncodedPointer(cie_info.lsda_encoding, true, &entry, sink);
-      if (lsda) {
-      }
-      */
-
-      sink->AddFileRangeForVMAddr("dwarf_fde", address, full_entry);
-    }
-  }
-}
-
-// See documentation here:
-//   http://refspecs.linuxfoundation.org/LSB_5.0.0/LSB-Core-generic/LSB-Core-generic/ehframechpt.html#EHFRAME
-void ReadEhFrameHdr(string_view data, RangeSink* sink) {
-  const char* base = data.data();
-  uint8_t version = ReadFixed<uint8_t>(&data);
-  uint8_t eh_frame_ptr_enc = ReadFixed<uint8_t>(&data);
-  uint8_t fde_count_enc = ReadFixed<uint8_t>(&data);
-  uint8_t table_enc = ReadFixed<uint8_t>(&data);
-
-  if (version != 1) {
-    THROWF("Unknown eh_frame_hdr version: $0", version);
-  }
-
-  // TODO(haberman): don't hard-code 64-bit.
-  uint64_t eh_frame_ptr =
-      ReadEncodedPointer(eh_frame_ptr_enc, true, &data, base, sink);
-  (void)eh_frame_ptr;
-  uint64_t fde_count =
-      ReadEncodedPointer(fde_count_enc, true, &data, base, sink);
-
-  for (uint64_t i = 0; i < fde_count; i++) {
-    string_view entry_data = data;
-    uint64_t initial_location =
-        ReadEncodedPointer(table_enc, true, &data, base, sink);
-    uint64_t fde_addr = ReadEncodedPointer(table_enc, true, &data, base, sink);
-    entry_data.remove_suffix(data.size());
-    sink->AddFileRangeForVMAddr("dwarf_fde_table", initial_location,
-                                entry_data);
-
-    // We could add fde_addr with an unknown length if we wanted to skip reading
-    // eh_frame.  We can't count on this table being available though, so we
-    // don't want to remove the eh_frame reading code altogether.
-    (void)fde_addr;
-  }
-}
-
-static void ReadDWARFStmtListRange(const dwarf::File& file, uint64_t offset,
-                                   string_view unit_name, RangeSink* sink) {
-  string_view data = file.debug_line;
+static void ReadDWARFStmtListRange(const dwarf::CU& cu, uint64_t offset,
+                                   RangeSink* sink) {
+  string_view data = cu.dwarf().debug_line;
   SkipBytes(offset, &data);
   string_view data_with_length = data;
   dwarf::CompilationUnitSizes sizes;
   data = sizes.ReadInitialLength(&data);
   data = data_with_length.substr(
       0, data.size() + (data.data() - data_with_length.data()));
-  sink->AddFileRange("dwarf_stmtlistrange", unit_name, data);
+  sink->AddFileRange("dwarf_stmtlistrange", cu.unit_name(), data);
 }
 
 // The DWARF debug info can help us get compileunits info.  DIEs for compilation
 // units, functions, and global variables often have attributes that will
 // resolve to addresses.
-static void ReadDWARFDebugInfo(
-    const dwarf::File& file, dwarf::DIEReader::Section section,
-    const SymbolTable& symtab, const DualMap& symbol_map, RangeSink* sink,
-    std::unordered_map<uint64_t, std::string>* stmt_list_map) {
-  dwarf::DIEReader die_reader(file);
-  die_reader.set_strp_sink(sink);
+static void ReadDWARFDebugInfo(dwarf::InfoReader& reader,
+                               dwarf::InfoReader::Section section,
+                               const DualMap& symbol_map, RangeSink* sink) {
+  dwarf::CUIter iter = reader.GetCUIter(section);
+  dwarf::CU cu;
+  cu.SetIndirectStringCallback([sink, &cu](string_view str) {
+    sink->AddFileRange("dwarf_strp", cu.unit_name(), str);
+  });
 
-  if (!die_reader.SeekToStart(section)) {
-    return;
-  }
-
-  do {
+  while (iter.NextCU(reader, &cu)) {
+    dwarf::DIEReader die_reader = cu.GetDIEReader();
     GeneralDIE compileunit_die;
+    auto* abbrev = die_reader.ReadCode(cu);
     die_reader.ReadAttributes(
-        [&die_reader, &compileunit_die](uint16_t tag, dwarf::AttrValue value) {
-          switch (tag) {
-            case DW_AT_addr_base:
-              die_reader.mutable_unit_sizes()->SetAddrBase(value.GetUint(die_reader));
-              break;
-            case DW_AT_str_offsets_base:
-              die_reader.mutable_unit_sizes()->SetStrOffsetsBase(value.GetUint(die_reader));
-              break;
-            case DW_AT_rnglists_base:
-              die_reader.mutable_unit_sizes()->SetRangeListsBase(value.GetUint(die_reader));
-              break;
-            default:
-              ReadGeneralDIEAttr(tag, value, &compileunit_die);
-              break;
-            }
+        cu, abbrev,
+        [&cu, &compileunit_die](uint16_t tag, dwarf::AttrValue value) {
+          ReadGeneralDIEAttr(tag, value, cu, &compileunit_die);
         });
-    std::string compileunit_name;
-    if (compileunit_die.name && compileunit_die.name->IsString()) {
-      compileunit_name =
-          std::string(compileunit_die.name->GetString(die_reader));
-    }
 
-    uint64_t stmt_list = UINT64_MAX;
-
-    if (compileunit_die.stmt_list && compileunit_die.stmt_list->IsUint()) {
-      stmt_list = compileunit_die.stmt_list->GetUint(die_reader);
-      if (compileunit_name.empty()) {
-        auto iter = stmt_list_map->find(stmt_list);
-        if (iter != stmt_list_map->end()) {
-          compileunit_name = iter->second;
-        }
-      } else {
-        (*stmt_list_map)[stmt_list] = compileunit_name;
-      }
-    }
-
-    if (compileunit_name.empty()) {
+    if (cu.unit_name().empty()) {
       continue;
     }
 
-    die_reader.set_compileunit_name(compileunit_name);
-    sink->AddFileRange("dwarf_debuginfo", compileunit_name,
-                       die_reader.unit_range());
-    AddDIE(file, compileunit_name, compileunit_die, symtab, symbol_map,
-           die_reader, sink);
+    sink->AddFileRange("dwarf_debuginfo", cu.unit_name(), cu.entire_unit());
+    AddDIE(cu, compileunit_die, symbol_map, sink);
 
-    if (stmt_list != UINT64_MAX) {
-      ReadDWARFStmtListRange(file, stmt_list, compileunit_name, sink);
+    if (compileunit_die.stmt_list) {
+      ReadDWARFStmtListRange(cu, *compileunit_die.stmt_list, sink);
     }
 
-    string_view abbrev_data = file.debug_abbrev;
-    SkipBytes(die_reader.debug_abbrev_offset(), &abbrev_data);
-    dwarf::AbbrevTable unit_abbrev;
-    abbrev_data = unit_abbrev.ReadAbbrevs(abbrev_data);
-    sink->AddFileRange("dwarf_abbrev", compileunit_name, abbrev_data);
+    sink->AddFileRange("dwarf_abbrev", cu.unit_name(), cu.unit_abbrev().abbrev_data());
 
-    while (die_reader.NextDIE()) {
+    while (auto abbrev = die_reader.ReadCode(cu)) {
       GeneralDIE die;
-      die_reader.ReadAttributes([&die](uint16_t tag, dwarf::AttrValue value) {
-        ReadGeneralDIEAttr(tag, value, &die);
-      });
+      die_reader.ReadAttributes(
+          cu, abbrev, [&cu, &die](uint16_t tag, dwarf::AttrValue value) {
+            ReadGeneralDIEAttr(tag, value, cu, &die);
+          });
 
-      // If low_pc is present but not a valid address, it indicates this this
-      // entity was stripped from the binary, so we want to skip ti.
-      bool is_stripped =
-          die.low_pc && die.low_pc->IsUint() &&
-          !dwarf::IsValidDwarfAddress(die.low_pc->GetUint(die_reader),
-                                      die_reader.unit_sizes().address_size());
-
-      // A declaration is not a definition and should not be attributed to this
-      // compileunit.
-      bool is_decl = die.declaration && die.declaration->IsUint() &&
-          die.declaration->GetUint(die_reader);
-
-      if (is_stripped || is_decl) {
-        die_reader.SkipChildren();
+      // low_pc == 0 is a signal that this routine was stripped out of the
+      // final binary. Also any declaration should be skipped.
+      if ((die.low_pc && !cu.IsValidDwarfAddress(*die.low_pc)) ||
+          die.declaration) {
+        die_reader.SkipChildren(cu, abbrev);
       } else {
-        AddDIE(file, compileunit_name, die, symtab, symbol_map, die_reader,
-               sink);
+        AddDIE(cu, die, symbol_map, sink);
       }
     }
-  } while (die_reader.NextCompilationUnit());
+  }
 }
 
-void ReadDWARFCompileUnits(const dwarf::File& file, const SymbolTable& symtab,
-                           const DualMap& symbol_map, RangeSink* sink) {
+void ReadDWARFCompileUnits(const dwarf::File& file, const DualMap& symbol_map,
+                           RangeSink* sink) {
   if (!file.debug_info.size()) {
     THROW("missing debug info");
   }
@@ -2194,13 +637,15 @@
     ReadDWARFAddressRanges(file, sink);
   }
 
-  std::unordered_map<uint64_t, std::string> stmt_list_map;
-  ReadDWARFDebugInfo(file, dwarf::DIEReader::Section::kDebugInfo, symtab,
-                     symbol_map, sink, &stmt_list_map);
-  ReadDWARFDebugInfo(file, dwarf::DIEReader::Section::kDebugTypes, symtab,
-                     symbol_map, sink, &stmt_list_map);
-  ReadDWARFPubNames(file, file.debug_pubnames, sink);
-  ReadDWARFPubNames(file, file.debug_pubtypes, sink);
+  // Share a reader to avoid re-parsing debug abbreviations.
+  dwarf::InfoReader reader(file);
+
+  ReadDWARFDebugInfo(reader, dwarf::InfoReader::Section::kDebugInfo, symbol_map,
+                     sink);
+  ReadDWARFDebugInfo(reader, dwarf::InfoReader::Section::kDebugTypes,
+                     symbol_map, sink);
+  ReadDWARFPubNames(reader, file.debug_pubnames, sink);
+  ReadDWARFPubNames(reader, file.debug_pubtypes, sink);
 }
 
 static std::string LineInfoKey(const std::string& file, uint32_t line,
@@ -2249,35 +694,29 @@
     THROW("no debug info");
   }
 
-  dwarf::DIEReader die_reader(file);
+  dwarf::InfoReader reader(file);
+  dwarf::CUIter iter = reader.GetCUIter(dwarf::InfoReader::Section::kDebugInfo);
+  dwarf::CU cu;
+  dwarf::DIEReader die_reader = cu.GetDIEReader();
   dwarf::LineInfoReader line_info_reader(file);
 
-  if (!die_reader.SeekToStart(dwarf::DIEReader::Section::kDebugInfo)) {
+  if (!iter.NextCU(reader, &cu)) {
     THROW("debug info is present, but empty");
   }
 
-  while (true) {
-    InlinesDIE die;
+  while (auto abbrev = die_reader.ReadCode(cu)) {
+    absl::optional<uint64_t> stmt_list;
     die_reader.ReadAttributes(
-        [&die, &die_reader](uint16_t tag, dwarf::AttrValue val) {
-          switch (tag) {
-          case DW_AT_stmt_list:
-            if (auto uint = val.ToUint(die_reader))
-              die.set_stmt_list(uint.value());
-            break;
+        cu, abbrev, [&stmt_list, &cu](uint16_t tag, dwarf::AttrValue val) {
+          if (tag == DW_AT_stmt_list) {
+            stmt_list = val.ToUint(cu);
           }
         });
 
-    if (die.has_stmt_list()) {
-      uint64_t offset = die.stmt_list();
-      line_info_reader.SeekToOffset(offset,
-                                    die_reader.unit_sizes().address_size());
+    if (stmt_list) {
+      line_info_reader.SeekToOffset(*stmt_list, cu.unit_sizes().address_size());
       ReadDWARFStmtList(include_line, &line_info_reader, sink);
     }
-
-    if (!die_reader.NextCompilationUnit()) {
-      return;
-    }
   }
 }
 

diff --git a/src/dwarf/attr.cc b/src/dwarf/attr.cc
new file mode 100644
index 0000000..6cb359c
--- /dev/null
+++ b/src/dwarf/attr.cc

@@ -0,0 +1,208 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "dwarf/attr.h"
+
+#include "dwarf/debug_info.h"
+#include "dwarf/dwarf_util.h"
+#include "dwarf_constants.h"
+#include "util.h"
+
+using string_view = absl::string_view;
+using namespace dwarf2reader;
+
+namespace bloaty {
+namespace dwarf {
+
+absl::optional<uint64_t> AttrValue::ToUint(const CU& cu) const {
+  if (IsUint()) return GetUint(cu);
+  string_view str = GetString(cu);  // Fixed-size data forms hold raw bytes.
+  switch (str.size()) {
+    case 1:
+      return ReadFixed<uint8_t>(&str);
+    case 2:
+      return ReadFixed<uint16_t>(&str);  // Read both bytes, not only the first.
+    case 4:
+      return ReadFixed<uint32_t>(&str);
+    case 8:
+      return ReadFixed<uint64_t>(&str);
+  }
+  return absl::nullopt;  // Any other length cannot be coerced to an integer.
+}
+
+uint64_t AttrValue::GetUint(const CU& cu) const {
+  if (type_ == Type::kUnresolvedUint) {
+    return ResolveIndirectAddress(cu);
+  } else {
+    assert(type_ == Type::kUint);
+    return uint_;
+  }
+}
+
+string_view AttrValue::GetString(const CU& cu) const {
+  if (type_ == Type::kUnresolvedString) {
+    return ResolveDoubleIndirectString(cu);
+  } else {
+    assert(type_ == Type::kString);
+    return string_;
+  }
+}
+
+template <class D>
+string_view AttrValue::ReadBlock(string_view* data) {
+  D len = ReadFixed<D>(data);
+  return ReadBytes(len, data);
+}
+
+string_view AttrValue::ReadVariableBlock(string_view* data) {
+  uint64_t len = ReadLEB128<uint64_t>(data);
+  return ReadBytes(len, data);
+}
+
+string_view AttrValue::ResolveIndirectString(const CU& cu, uint64_t ofs) {
+  string_view ret = ReadDebugStrEntry(cu.dwarf().debug_str, ofs);
+  cu.AddIndirectString(ret);
+  return ret;
+}
+
+template <class D>
+string_view AttrValue::ReadIndirectString(const CU& cu, string_view* data) {
+  return ResolveIndirectString(cu, ReadFixed<D>(data));
+}
+
+string_view
+AttrValue::ResolveDoubleIndirectString(const CU &cu) const {
+  uint64_t ofs = uint_;
+  string_view offsets = cu.dwarf().debug_str_offsets;
+  uint64_t ofs2;
+  if (cu.unit_sizes().dwarf64()) {
+    SkipBytes((ofs * 8) + cu.str_offsets_base(), &offsets);
+    ofs2 = ReadFixed<uint64_t>(&offsets);
+  } else {
+    SkipBytes((ofs * 4) + cu.str_offsets_base(), &offsets);
+    ofs2 = ReadFixed<uint32_t>(&offsets);
+  }
+  string_view ret = ReadDebugStrEntry(cu.dwarf().debug_str, ofs2);
+  cu.AddIndirectString(ret);
+  return ret;
+}
+
+uint64_t AttrValue::ResolveIndirectAddress(const CU& cu) const {
+  return ReadIndirectAddress(cu, uint_);
+}
+
+AttrValue AttrValue::ParseAttr(const CU& cu, uint8_t form, string_view* data) {
+  switch (form) {
+    case DW_FORM_indirect: {
+      uint16_t indirect_form = ReadLEB128<uint16_t>(data);
+      if (indirect_form == DW_FORM_indirect) {
+        THROW("indirect attribute has indirect form type");
+      }
+      return ParseAttr(cu, indirect_form, data);
+    }
+    case DW_FORM_ref1:
+      return AttrValue(form, ReadFixed<uint8_t>(data));
+    case DW_FORM_ref2:
+      return AttrValue(form, ReadFixed<uint16_t>(data));
+    case DW_FORM_ref4:
+      return AttrValue(form, ReadFixed<uint32_t>(data));
+    case DW_FORM_ref_sig8:
+    case DW_FORM_ref8:
+      return AttrValue(form, ReadFixed<uint64_t>(data));
+    case DW_FORM_strx1:
+      return AttrValue::UnresolvedString(form, ReadFixed<uint8_t>(data));
+    case DW_FORM_strx2:
+      return AttrValue::UnresolvedString(form, ReadFixed<uint16_t>(data));
+    case DW_FORM_strx4:
+      return AttrValue::UnresolvedString(form, ReadFixed<uint32_t>(data));
+    case DW_FORM_strx:
+      return AttrValue::UnresolvedString(form, ReadLEB128<uint64_t>(data));
+    case DW_FORM_addrx1:
+      return AttrValue::UnresolvedUint(form, ReadFixed<uint8_t>(data));
+    case DW_FORM_addrx2:
+      return AttrValue::UnresolvedUint(form, ReadFixed<uint16_t>(data));
+    case DW_FORM_addrx3:
+      return AttrValue::UnresolvedUint(form, ReadFixed<uint32_t, 3>(data));
+    case DW_FORM_addrx4:
+      return AttrValue::UnresolvedUint(form, ReadFixed<uint32_t>(data));
+    case DW_FORM_addrx:
+      return AttrValue::UnresolvedUint(form, ReadLEB128<uint64_t>(data));
+    case DW_FORM_addr:
+    address_size:
+      switch (cu.unit_sizes().address_size()) {
+        case 4:
+          return AttrValue(form, ReadFixed<uint32_t>(data));
+        case 8:
+          return AttrValue(form, ReadFixed<uint64_t>(data));
+        default:
+          BLOATY_UNREACHABLE();
+      }
+    case DW_FORM_ref_addr:
+      if (cu.unit_sizes().dwarf_version() <= 2) {
+        goto address_size;
+      }
+      ABSL_FALLTHROUGH_INTENDED;
+    case DW_FORM_sec_offset:
+      if (cu.unit_sizes().dwarf64()) {
+        return AttrValue(form, ReadFixed<uint64_t>(data));
+      } else {
+        return AttrValue(form, ReadFixed<uint32_t>(data));
+      }
+    case DW_FORM_ref_udata:  // ULEB128 reference: a plain uint, not a strx.
+    case DW_FORM_udata:
+      return AttrValue(form, ReadLEB128<uint64_t>(data));
+    case DW_FORM_block1:
+      return AttrValue(form, ReadBlock<uint8_t>(data));
+    case DW_FORM_block2:
+      return AttrValue(form, ReadBlock<uint16_t>(data));
+    case DW_FORM_block4:
+      return AttrValue(form, ReadBlock<uint32_t>(data));
+    case DW_FORM_block:
+    case DW_FORM_exprloc:
+      return AttrValue(form, ReadVariableBlock(data));
+    case DW_FORM_string:
+      return AttrValue(form, ReadNullTerminated(data));
+    case DW_FORM_strp:
+      if (cu.unit_sizes().dwarf64()) {
+        return AttrValue(form, ReadIndirectString<uint64_t>(cu, data));
+      } else {
+        return AttrValue(form, ReadIndirectString<uint32_t>(cu, data));
+      }
+    case DW_FORM_data1:
+      return AttrValue(form, ReadBytes(1, data));
+    case DW_FORM_data2:
+      return AttrValue(form, ReadBytes(2, data));
+    case DW_FORM_data4:
+      return AttrValue(form, ReadBytes(4, data));
+    case DW_FORM_data8:
+      return AttrValue(form, ReadBytes(8, data));
+    case DW_FORM_loclistx:
+    case DW_FORM_rnglistx:
+      return AttrValue(form, ReadLEB128<uint64_t>(data));
+
+    // Bloaty doesn't currently care about any bool or signed data.
+    // So we fudge it a bit and just stuff these in a uint64.
+    case DW_FORM_flag_present:
+      return AttrValue(form, 1);
+    case DW_FORM_flag:
+      return AttrValue(form, ReadFixed<uint8_t>(data));
+    case DW_FORM_sdata:
+      return AttrValue(form, ReadLEB128<uint64_t>(data));
+    default:
+      THROWF("Don't know how to parse DWARF form: $0", form);
+  }
+}
+
+}  // namespace dwarf
+}  // namespace bloaty

diff --git a/src/dwarf/attr.h b/src/dwarf/attr.h
new file mode 100644
index 0000000..9261d26
--- /dev/null
+++ b/src/dwarf/attr.h

@@ -0,0 +1,118 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef BLOATY_DWARF_ATTR_H_
+#define BLOATY_DWARF_ATTR_H_
+
+#include <cstdint>
+
+#include "absl/strings/string_view.h"
+#include "absl/types/optional.h"
+
+namespace bloaty {
+namespace dwarf {
+
+class CU;
+
+class AttrValue {
+ public:
+  static AttrValue ParseAttr(const CU& cu, uint8_t form, absl::string_view* data);
+
+  AttrValue(const AttrValue &) = default;
+  AttrValue &operator=(const AttrValue &) = default;
+
+  uint16_t form() const { return form_; }
+
+  bool IsUint() const {
+    return type_ == Type::kUint || type_ == Type::kUnresolvedUint;
+  }
+
+  bool IsString() const {
+    return type_ == Type::kString || type_ == Type::kUnresolvedString;
+  }
+
+  // Attempts to coerce to uint, returning nullopt if this is not possible.
+  absl::optional<uint64_t> ToUint(const CU& cu) const;
+
+  // REQUIRES: IsUint().
+  uint64_t GetUint(const CU& cu) const;
+
+  // REQUIRES: IsString().
+  absl::string_view GetString(const CU& cu) const;
+
+ private:
+  explicit AttrValue(uint16_t form, uint64_t val)
+      : uint_(val), form_(form), type_(Type::kUint) {}
+  explicit AttrValue(uint16_t form, absl::string_view val)
+      : string_(val), form_(form), type_(Type::kString) {}
+
+  // We delay the resolution of indirect strings and addresses, both to avoid
+  // unnecessary work and because they may depend on base values that occur
+  // after them in the sequence of attributes, eg.
+  //
+  // $ dwarfdump -i bloaty
+  //   COMPILE_UNIT<header overall offset = 0x00000000>:
+  // < 0><0x0000000c>  DW_TAG_compile_unit
+  //                     DW_AT_producer              (indexed string: 0x00000000)Debian clang version 11.0.1-2
+  //                     DW_AT_language              DW_LANG_C_plus_plus_14
+  //                     DW_AT_name                  (indexed string: 0x00000001)../src/main.cc
+  //                     DW_AT_str_offsets_base      0x00000008
+  //
+  // Note that DW_AT_name comes before DW_AT_str_offsets_base, but the latter
+  // value is required to resolve the name attribute.
+  enum class Type {
+    kUint,
+    kString,
+    kUnresolvedUint,
+    kUnresolvedString
+  };
+
+  Type type() const { return type_; }
+
+  static AttrValue UnresolvedUint(uint16_t form, uint64_t val) {
+     AttrValue ret(form, val);
+     ret.type_ = Type::kUnresolvedUint;
+     return ret;
+  }
+
+  static AttrValue UnresolvedString(uint16_t form, uint64_t val) {
+     AttrValue ret(form, val);
+     ret.type_ = Type::kUnresolvedString;
+     return ret;
+  }
+
+  union {
+    uint64_t uint_;
+    absl::string_view string_;
+  };
+
+  uint16_t form_;
+  Type type_;
+
+  template <class D>
+  static absl::string_view ReadBlock(absl::string_view* data);
+  static absl::string_view ReadVariableBlock(absl::string_view* data);
+  template <class D>
+  static absl::string_view ReadIndirectString(const CU& cu,
+                                              absl::string_view* data);
+  static absl::string_view ResolveIndirectString(const CU& cu, uint64_t ofs);
+
+  absl::string_view ResolveDoubleIndirectString(const CU &cu) const;
+  uint64_t ResolveIndirectAddress(const CU& cu) const;
+};
+
+}  // namespace dwarf
+}  // namespace bloaty
+
+#endif

diff --git a/src/dwarf/debug_info.cc b/src/dwarf/debug_info.cc
new file mode 100644
index 0000000..5dc917c
--- /dev/null
+++ b/src/dwarf/debug_info.cc

@@ -0,0 +1,277 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "dwarf/debug_info.h"
+#include "dwarf_constants.h"
+#include "dwarf/dwarf_util.h"
+
+using namespace dwarf2reader;
+
+using absl::string_view;
+
+namespace bloaty {
+namespace dwarf {
+
+// Parses abbreviation declarations from |data| until the terminating zero code
+// is read, storing each one in abbrev_ keyed by its code.  On return
+// abbrev_data_ spans the bytes consumed, terminator included.  Throws on a
+// duplicate code or on a has_child byte that is neither yes nor no.
+void AbbrevTable::ReadAbbrevs(string_view data) {
+  const char* const begin = data.data();
+
+  for (uint32_t code = ReadLEB128<uint32_t>(&data); code != 0;
+       code = ReadLEB128<uint32_t>(&data)) {
+    Abbrev& entry = abbrev_[code];
+    if (entry.code != 0) {
+      THROW("DWARF data contained duplicate abbrev code");
+    }
+
+    entry.code = code;
+    entry.tag = ReadLEB128<uint16_t>(&data);
+
+    const uint8_t children = ReadFixed<uint8_t>(&data);
+    if (children == DW_children_yes) {
+      entry.has_child = true;
+    } else if (children == DW_children_no) {
+      entry.has_child = false;
+    } else {
+      THROWF("DWARF has_child is neither true nor false: $0, code=$1, tag=$2",
+             children, entry.code, entry.tag);
+    }
+
+    // Attribute specifications run until a (0, 0) name/form pair.
+    for (;;) {
+      Attribute spec;
+      spec.name = ReadLEB128<uint16_t>(&data);
+      spec.form = ReadLEB128<uint8_t>(&data);
+      if (spec.name == 0 && spec.form == 0) {
+        break;
+      }
+      entry.attr.push_back(spec);
+    }
+  }
+
+  abbrev_data_ = string_view(begin, data.data() - begin);
+}
+
+// Reads an initial length from the front of |*remaining| and records whether
+// it used the 64-bit encoding.  Returns the bytes covered by that length and
+// leaves |*remaining| pointing just past them.  Throws if fewer bytes are
+// available than the length claims.
+absl::string_view CompilationUnitSizes::ReadInitialLength(
+    absl::string_view* remaining) {
+  uint64_t length = ReadFixed<uint32_t>(remaining);
+
+  // 0xffffffff is the escape value announcing that a 64-bit length follows.
+  dwarf64_ = (length == 0xffffffff);
+  if (dwarf64_) {
+    length = ReadFixed<uint64_t>(remaining);
+  }
+
+  if (length > remaining->size()) {
+    THROW("short DWARF compilation unit");
+  }
+
+  const absl::string_view unit = remaining->substr(0, length);
+  remaining->remove_prefix(length);
+  return unit;
+}
+
+// Returns an iterator over the units of |section|, starting |offset| bytes
+// into that section's data.
+CUIter InfoReader::GetCUIter(Section section, uint64_t offset) {
+  string_view contents = (section == Section::kDebugInfo) ? dwarf_.debug_info
+                                                          : dwarf_.debug_types;
+  SkipBytes(offset, &contents);
+  return CUIter(section, contents);
+}
+
+// Loads the next unit into |cu|.  Returns false, leaving |cu| untouched, once
+// no unit data remains.
+bool CUIter::NextCU(InfoReader& reader, CU* cu) {
+  if (next_unit_.empty()) {
+    return false;
+  }
+
+  // Remember where the unit starts so that the range handed to the CU also
+  // covers the initial length field that ReadInitialLength() consumes.
+  const string_view from_start = next_unit_;
+  const string_view contents = cu->unit_sizes_.ReadInitialLength(&next_unit_);
+  const size_t length_field_size = contents.data() - from_start.data();
+  const string_view whole_unit =
+      from_start.substr(0, contents.size() + length_field_size);
+
+  // Delegate to CU to read the unit header.
+  cu->ReadHeader(whole_unit, contents, section_, reader);
+  return true;
+}
+
+// Reads the header of this CU from |data|, updating our member variables
+// according to what was parsed, and then reads the top-level DIE.
+//
+// |entire_unit| is the whole unit including its initial length field; |data|
+// is what follows the initial length.  |section| says which section the unit
+// came from, which decides whether a pre-DWARF 5 header carries type unit
+// fields.  Throws if the unit's DWARF version is greater than 5.
+void CU::ReadHeader(string_view entire_unit, string_view data,
+                    InfoReader::Section section, InfoReader& reader) {
+  entire_unit_ = entire_unit;
+  dwarf_ = &reader.dwarf_;
+  unit_sizes_.ReadDWARFVersion(&data);
+
+  if (unit_sizes_.dwarf_version() > 5) {
+    THROWF("Data is in DWARF $0 format which we don't understand",
+           unit_sizes_.dwarf_version());
+  }
+
+  uint64_t debug_abbrev_offset;
+
+  if (unit_sizes_.dwarf_version() == 5) {
+    // DWARF 5 order: unit_type, address_size, debug_abbrev_offset, then fields
+    // that depend on the unit type.
+    unit_type_ = ReadFixed<uint8_t>(&data);
+    unit_sizes_.SetAddressSize(ReadFixed<uint8_t>(&data));
+    debug_abbrev_offset = unit_sizes_.ReadDWARFOffset(&data);
+
+    switch (unit_type_) {
+      case DW_UT_skeleton:
+      case DW_UT_split_compile:
+        dwo_id_ = ReadFixed<uint64_t>(&data);
+        break;
+      case DW_UT_type:
+      case DW_UT_split_type:
+        // Type units, split or not, carry a type signature followed by a type
+        // offset (DWARF 5 section 7.5.1.3); they have no dwo_id.  Reading only
+        // eight bytes here would leave |data| pointing at the type offset
+        // instead of the first DIE.
+        unit_type_signature_ = ReadFixed<uint64_t>(&data);
+        unit_type_offset_ = unit_sizes_.ReadDWARFOffset(&data);
+        break;
+      case DW_UT_compile:
+      case DW_UT_partial:
+        break;
+      default:
+        fprintf(stderr, "warning: Unknown DWARF Unit Type in user defined range\n");
+        break;
+    }
+
+  } else {
+    // Before DWARF 5 the abbrev offset comes first and there is no unit_type.
+    debug_abbrev_offset = unit_sizes_.ReadDWARFOffset(&data);
+    unit_sizes_.SetAddressSize(ReadFixed<uint8_t>(&data));
+
+    if (section == InfoReader::Section::kDebugTypes) {
+      unit_type_signature_ = ReadFixed<uint64_t>(&data);
+      unit_type_offset_ = unit_sizes_.ReadDWARFOffset(&data);
+    }
+  }
+
+  unit_abbrev_ = &reader.abbrev_tables_[debug_abbrev_offset];
+
+  // If we haven't already read abbreviations for this debug_abbrev_offset, we
+  // need to do so now.
+  if (unit_abbrev_->IsEmpty()) {
+    string_view abbrev_data = dwarf_->debug_abbrev;
+    SkipBytes(debug_abbrev_offset, &abbrev_data);
+    unit_abbrev_->ReadAbbrevs(abbrev_data);
+  }
+
+  data_ = data;
+  ReadTopLevelDIE(reader);
+}
+
+// Read the root-level DIE in order to populate some member variables on which
+// other attributes depend. In particular, we may re-parse this DIE later and
+// read attributes that are relative to these base addresses.
+//
+// Also determines unit_name_: from DW_AT_name when present, otherwise from an
+// earlier unit in |reader| that had the same DW_AT_stmt_list offset.
+void CU::ReadTopLevelDIE(InfoReader& reader) {
+  // A CU object can be reused for one unit after another, so forget everything
+  // that was learned from the previous unit's top-level DIE.
+  unit_name_.clear();
+  addr_base_ = 0;
+  str_offsets_base_ = 0;
+  range_lists_base_ = 0;
+
+  DIEReader die_reader = GetDIEReader();
+  const auto* abbrev = die_reader.ReadCode(*this);
+  if (abbrev == nullptr) {
+    // The unit has no DIE at all (no data, or only null entries).  There is
+    // nothing to read, and ReadAttributes() would dereference the null abbrev.
+    return;
+  }
+
+  absl::optional<uint64_t> stmt_list;
+
+  // DW_AT_name may need str_offsets_base_ to be resolved, and
+  // DW_AT_str_offsets_base can appear after DW_AT_name in the DIE.  Keep the
+  // raw value and resolve it only once every attribute has been seen.
+  absl::optional<dwarf::AttrValue> name;
+
+  die_reader.ReadAttributes(
+      *this, abbrev,
+      [this, &stmt_list, &name](uint16_t attr_name, dwarf::AttrValue value) {
+        switch (attr_name) {
+          case DW_AT_name:
+            name.emplace(value);
+            break;
+          case DW_AT_stmt_list:
+            if (value.form() == DW_FORM_sec_offset) {
+              stmt_list = value.GetUint(*this);
+            }
+            break;
+          case DW_AT_addr_base:
+            if (value.form() == DW_FORM_sec_offset) {
+              addr_base_ = value.GetUint(*this);
+            }
+            break;
+          case DW_AT_str_offsets_base:
+            if (value.form() == DW_FORM_sec_offset) {
+              str_offsets_base_ = value.GetUint(*this);
+            }
+            break;
+          case DW_AT_rnglists_base:
+            if (value.form() == DW_FORM_sec_offset) {
+              range_lists_base_ = value.GetUint(*this);
+            }
+            break;
+        }
+      });
+
+  if (name) {
+    unit_name_ = std::string(name->GetString(*this));
+  }
+
+  if (stmt_list) {
+    if (unit_name_.empty()) {
+      // Unnamed unit: borrow the name of a unit that shares its line table.
+      auto iter = reader.stmt_list_map_.find(*stmt_list);
+      if (iter != reader.stmt_list_map_.end()) {
+        unit_name_ = iter->second;
+      }
+    } else {
+      (reader.stmt_list_map_)[*stmt_list] = unit_name_;
+    }
+  }
+}
+
+// Consumes any run of zero bytes at the read position.  Each one is a null
+// entry terminating a chain of sibling entries, so depth_ drops by one per
+// byte consumed.
+void DIEReader::SkipNullEntries() {
+  for (; !remaining_.empty() && remaining_.front() == 0; --depth_) {
+    remaining_.remove_prefix(1);
+  }
+}
+
+// Reads the abbreviation code of the next DIE and returns the matching
+// abbreviation from |cu|'s table, or nullptr when no data is left after
+// skipping null entries.  Increments depth_ when the DIE has children.  Throws
+// if the code is not in the table.
+const AbbrevTable::Abbrev* DIEReader::ReadCode(const CU& cu) {
+  SkipNullEntries();
+  if (remaining_.empty()) {
+    return nullptr;
+  }
+
+  const uint32_t abbrev_code = ReadLEB128<uint32_t>(&remaining_);
+  const AbbrevTable::Abbrev* found;
+  const bool known = cu.unit_abbrev_->GetAbbrev(abbrev_code, &found);
+  if (!known) {
+    THROW("couldn't find abbreviation for code");
+  }
+
+  depth_ += found->has_child ? 1 : 0;
+  return found;
+}
+
+// Skips every descendant of the DIE described by |abbrev|, which must be the
+// DIE most recently returned by ReadCode().  Does nothing for a DIE without
+// children.
+void DIEReader::SkipChildren(const CU& cu, const AbbrevTable::Abbrev* abbrev) {
+  if (abbrev->has_child) {
+    // ReadCode() already raised depth_ for this DIE; read entries until the
+    // matching null entry brings it back down.
+    const int stop_depth = depth_ - 1;
+    for (SkipNullEntries(); depth_ > stop_depth; SkipNullEntries()) {
+      // TODO(haberman): use DW_AT_sibling to optimize skipping when it is
+      // available.
+      const AbbrevTable::Abbrev* child = ReadCode(cu);
+      if (child == nullptr) {
+        return;
+      }
+      ReadAttributes(cu, child, [](uint16_t, dwarf::AttrValue) {});
+    }
+  }
+}
+
+}  // namespace dwarf
+}  // namespace bloaty

diff --git a/src/dwarf/debug_info.h b/src/dwarf/debug_info.h
new file mode 100644
index 0000000..d1b0f79
--- /dev/null
+++ b/src/dwarf/debug_info.h

@@ -0,0 +1,355 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+//
+// Classes for reading .debug_info and .debug_types.
+//
+// Usage overview:
+//
+//   // Stores/caches abbreviation info and CU names.  |file| is a dwarf::File.
+//   dwarf::InfoReader reader(file);
+//
+//   // Iterator type for enumerating CUs. Initially positioned at the beginning
+//   // of the given section unless you pass an explicit offset.
+//   dwarf::CUIter iter = reader.GetCUIter(
+//       dwarf::InfoReader::Section::kDebugInfo);
+//
+//   // Represents a single CU and vends a lot of useful data about it, like its
+//   // name. Starts out empty/undefined until you call NextCU().
+//   dwarf::CU cu;
+//
+//   while (iter.NextCU(reader, &cu)) {
+//     std::cout << "Parsing CU with name=" << cu.unit_name() << "\n";
+//
+//     // Iterator for enumerating DIEs in a given CU.
+//     dwarf::DIEReader die_reader = cu.GetDIEReader();
+//     while (auto abbrev = die_reader.ReadCode(cu)) {
+//       if (IsInteresting(abbrev->tag)) {
+//         die_reader.ReadAttributes(
+//             cu, abbrev, [](uint16_t tag, dwarf::AttrValue val) {
+//            // Process attribute.
+//         });
+//       } else {
+//         die_reader.SkipChildren(cu, abbrev);
+//       }
+//     }
+//   }
+
+#ifndef BLOATY_DWARF_DEBUG_INFO_H_
+#define BLOATY_DWARF_DEBUG_INFO_H_
+
+#include <functional>
+#include <unordered_map>
+
+#include "absl/strings/string_view.h"
+#include "absl/strings/substitute.h"
+#include "dwarf/attr.h"
+#include "dwarf/dwarf_util.h"
+#include "dwarf_constants.h"
+#include "util.h"
+
+namespace bloaty {
+namespace dwarf {
+
+// The contents of the DWARF sections of one file: one string_view per section,
+// each field named after its section.
+struct File {
+  absl::string_view debug_abbrev;
+  absl::string_view debug_addr;
+  absl::string_view debug_aranges;
+  absl::string_view debug_info;
+  absl::string_view debug_line;
+  absl::string_view debug_loc;
+  absl::string_view debug_pubnames;
+  absl::string_view debug_pubtypes;
+  absl::string_view debug_ranges;
+  absl::string_view debug_rnglists;
+  absl::string_view debug_str;
+  absl::string_view debug_str_offsets;
+  absl::string_view debug_types;
+
+  absl::string_view* GetFieldByName(absl::string_view name);
+
+  // Stores |contents| in the field GetFieldByName() returns for |name|.  Does
+  // nothing when GetFieldByName() returns null.
+  void SetFieldByName(absl::string_view name, absl::string_view contents) {
+    if (absl::string_view* field = GetFieldByName(name)) {
+      *field = contents;
+    }
+  }
+};
+
+// A class that represents the DWARF version and address sizes for a given
+// compilation unit.
+//
+// All fields start out zero/false and are filled in by ReadInitialLength(),
+// ReadDWARFVersion() and SetAddressSize().
+class CompilationUnitSizes {
+ public:
+  // When true, DWARF offsets are 64 bits, otherwise they are 32 bit.
+  bool dwarf64() const { return dwarf64_; }
+
+  // The size of addresses.  Guaranteed to be either 4 or 8.
+  uint8_t address_size() const { return addr8_ ? 8 : 4; }
+
+  // DWARF version of this unit.  Returned at the full 16-bit width it is read
+  // with, so that a corrupt version such as 0x0105 is not truncated to 5 and
+  // mistaken for a supported version.
+  uint16_t dwarf_version() const { return dwarf_version_; }
+
+  // Sets the address size.  Throws unless |address_size| is 4 or 8.
+  void SetAddressSize(uint8_t address_size) {
+    if (address_size != 4 && address_size != 8) {
+      THROWF("Unexpected address size: $0", address_size);
+    }
+    addr8_ = address_size == 8;
+  }
+
+  // Reads a DWARF offset based on whether we are reading dwarf32 or dwarf64
+  // format.
+  uint64_t ReadDWARFOffset(absl::string_view* data) const {
+    return dwarf64_ ? ReadFixed<uint64_t>(data) : ReadFixed<uint32_t>(data);
+  }
+
+  // Reads an address according to the expected address_size.
+  uint64_t ReadAddress(absl::string_view* data) const {
+    return addr8_ ? ReadFixed<uint64_t>(data) : ReadFixed<uint32_t>(data);
+  }
+
+  // The largest value representable in an address of address_size() bytes.
+  uint64_t MaxAddress() const {
+    return addr8_ ? 0xffffffffffffffff : 0xffffffff;
+  }
+
+  // Reads an "initial length" as specified in many DWARF headers.  This
+  // contains either a 32-bit or a 64-bit length, and signals whether we are
+  // using the 32-bit or 64-bit DWARF format (so it sets dwarf64 appropriately).
+  //
+  // Returns the range for this section and stores the remaining data
+  // in |remaining|.
+  absl::string_view ReadInitialLength(absl::string_view* remaining);
+
+  // Reads the 16-bit DWARF version from the front of |data|.
+  void ReadDWARFVersion(absl::string_view* data) {
+    dwarf_version_ = ReadFixed<uint16_t>(data);
+  }
+
+ private:
+  // Initialized so that the accessors are well defined even before a header
+  // has been read.
+  uint16_t dwarf_version_ = 0;
+  bool dwarf64_ = false;
+  bool addr8_ = false;
+};
+
+// AbbrevTable /////////////////////////////////////////////////////////////////
+
+// Parses and stores a representation of (a portion of) the .debug_abbrev
+// section of a DWARF file.  An abbreviation is defined by a unique "code"
+// (unique within one table), and defines the DIE tag and set of attributes.
+// The encoding of the DIE then contains just the abbreviation code and the
+// attribute values -- thanks to the abbreviation table, the tag and attribute
+// keys/names are not required.
+//
+// The abbreviations are an internal detail of the DWARF format and users should
+// not need to care about them.
+
+class AbbrevTable {
+ public:
+  // Reads abbreviations until a terminating abbreviation is seen.
+  void ReadAbbrevs(absl::string_view data);
+
+  // One attribute specification of an abbreviation: the attribute's name and
+  // the form its value is encoded in.
+  struct Attribute {
+    uint16_t name;
+    uint8_t form;
+  };
+
+  // A single abbreviation: its code, the DIE tag, whether DIEs using it have
+  // children, and their attribute specifications in order.
+  struct Abbrev {
+    uint32_t code;
+    uint16_t tag;
+    bool has_child;
+    std::vector<Attribute> attr;
+  };
+
+  // True while no abbreviation has been stored in this table.
+  bool IsEmpty() const { return abbrev_.empty(); }
+
+  // The bytes that ReadAbbrevs() consumed.
+  absl::string_view abbrev_data() const { return abbrev_data_; }
+
+  // Looks up the abbreviation with the given code.  On success stores a
+  // pointer to it in |*abbrev| and returns true; otherwise returns false and
+  // leaves |*abbrev| untouched.
+  bool GetAbbrev(uint32_t code, const Abbrev** abbrev) const {
+    const auto found = abbrev_.find(code);
+    if (found == abbrev_.end()) {
+      return false;
+    }
+    *abbrev = &found->second;
+    return true;
+  }
+
+ private:
+  // Keyed by abbreviation code.
+  // Generally we expect these to be small, so we could almost use a vector<>.
+  // But you never know what crazy input data is going to do...
+  std::unordered_map<uint32_t, Abbrev> abbrev_;
+  absl::string_view abbrev_data_;
+};
+
+class CUIter;
+class CU;
+class DIEReader;
+
+// Stores/caches abbreviation info and CU names.
+//
+// Keeps a reference to the File it was constructed with rather than a copy, so
+// that File must outlive the reader.  Not copyable.
+class InfoReader {
+ public:
+  InfoReader(const File& file) : dwarf_(file) {}
+  InfoReader(const InfoReader&) = delete;
+  InfoReader& operator=(const InfoReader&) = delete;
+
+  // The File this reader was constructed with.
+  const File& dwarf() const { return dwarf_; }
+
+  // DIEs exist in both .debug_info and .debug_types.
+  enum class Section {
+    kDebugInfo,
+    kDebugTypes
+  };
+
+  // Returns an iterator over the units of |section|, positioned |offset| bytes
+  // into that section.
+  CUIter GetCUIter(Section section, uint64_t offset = 0);
+
+ private:
+  friend class CU;
+  const File& dwarf_;
+
+  // Unit names keyed by DW_AT_stmt_list offset.  CU::ReadTopLevelDIE() adds an
+  // entry for each named unit and uses the map to name unnamed units.
+  std::unordered_map<uint64_t, std::string> stmt_list_map_;
+
+  // All of the AbbrevTables we've read from .debug_abbrev, indexed by their
+  // offset within .debug_abbrev.
+  std::unordered_map<uint64_t, AbbrevTable> abbrev_tables_;
+};
+
+// Iterates over the units of one section.  Instances are created by
+// InfoReader::GetCUIter().
+class CUIter {
+ public:
+  // Reads the next unit into |cu| and returns true, or returns false without
+  // touching |cu| when no unit data remains.
+  bool NextCU(InfoReader& reader, CU* cu);
+
+ private:
+  friend class InfoReader;
+  CUIter(InfoReader::Section section, absl::string_view next_unit)
+      : section_(section), next_unit_(next_unit) {}
+
+  // Data for the next compilation unit.
+  InfoReader::Section section_;
+  absl::string_view next_unit_;
+};
+
+// CompilationUnit: stores info about a single compilation unit in .debug_info
+// or .debug_types.
+//
+// A default-constructed CU describes no unit until CUIter::NextCU() fills it
+// in.  Every member has a defined initial value, but dwarf() and unit_abbrev()
+// dereference pointers that stay null until then and must not be called
+// earlier.
+class CU {
+ public:
+  // Returns a reader positioned at the first DIE of this unit.
+  DIEReader GetDIEReader();
+
+  const File& dwarf() const { return *dwarf_; }
+  const CompilationUnitSizes& unit_sizes() const { return unit_sizes_; }
+  const std::string& unit_name() const { return unit_name_; }
+  absl::string_view entire_unit() const { return entire_unit_; }
+  uint64_t addr_base() const { return addr_base_; }
+  uint64_t str_offsets_base() const { return str_offsets_base_; }
+  uint64_t range_lists_base() const { return range_lists_base_; }
+  const AbbrevTable& unit_abbrev() const { return *unit_abbrev_; }
+
+  // Forwards |range| to the callback installed with
+  // SetIndirectStringCallback(), if there is one.
+  void AddIndirectString(absl::string_view range) const {
+    if (strp_callback_) {
+      strp_callback_(range);
+    }
+  }
+
+  // Installs the callback that AddIndirectString() invokes, replacing any
+  // previous one.
+  void SetIndirectStringCallback(
+      std::function<void(absl::string_view)> strp_sink) {
+    strp_callback_ = strp_sink;
+  }
+
+  // Applies dwarf::IsValidDwarfAddress() using this unit's address size.
+  bool IsValidDwarfAddress(uint64_t addr) const {
+    return dwarf::IsValidDwarfAddress(addr, unit_sizes_.address_size());
+  }
+
+ private:
+  friend class CUIter;
+  friend class DIEReader;
+
+  void ReadHeader(absl::string_view entire_unit, absl::string_view data,
+                  InfoReader::Section section, InfoReader& reader);
+  void ReadTopLevelDIE(InfoReader& reader);
+
+  // Set by ReadHeader(); null until a unit has been read.
+  const File* dwarf_ = nullptr;
+
+  // Info that comes from the CU header.
+  absl::string_view entire_unit_;  // Entire CU's range.
+  absl::string_view data_;         // Entire unit excluding CU header.
+  CompilationUnitSizes unit_sizes_;
+  AbbrevTable* unit_abbrev_ = nullptr;  // Null until a unit has been read.
+
+  // unit_type_ is only read from DWARF 5 headers; dwo_id_ only for skeleton
+  // and split units.
+  uint8_t unit_type_ = 0;
+  uint64_t dwo_id_ = 0;
+
+  // Only for type units.
+  uint64_t unit_type_signature_ = 0;
+  uint64_t unit_type_offset_ = 0;
+
+  // Info that comes from the top-level DIE.
+  std::string unit_name_;
+  uint64_t addr_base_ = 0;
+  uint64_t str_offsets_base_ = 0;
+  uint64_t range_lists_base_ = 0;
+
+  std::function<void(absl::string_view)> strp_callback_;
+};
+
+// DIEReader: for reading a sequence of Debugging Information Entries in a
+// compilation unit.  Instances are obtained from CU::GetDIEReader().
+class DIEReader {
+ public:
+  // Abbreviation for the current entry.
+  // Returns nullptr once no data is left after skipping null entries.
+  const AbbrevTable::Abbrev* ReadCode(const CU& cu);
+
+  // Parses each attribute listed in |code|, in order, from the read position
+  // and calls |func| with the attribute's name and parsed value.
+  template <class T>
+  void ReadAttributes(const CU& cu, const AbbrevTable::Abbrev* code, T&& func);
+
+  // Skips all descendants of the entry described by |code|; does nothing when
+  // that entry has no children.
+  void SkipChildren(const CU& cu, const AbbrevTable::Abbrev* code);
+
+ private:
+  // Internal APIs.
+  friend class CU;
+
+  DIEReader(absl::string_view data) : remaining_(data) {}
+  void SkipNullEntries();
+
+  // Our current read position.
+  absl::string_view remaining_;
+  // Raised by ReadCode() for each entry that has children and lowered by
+  // SkipNullEntries() for each null entry consumed.
+  int depth_ = 0;
+};
+
+// Returns entry number |val| of the address table that starts at
+// |cu|.addr_base() inside .debug_addr.  Entries are as wide as the unit's
+// address size.
+inline uint64_t ReadIndirectAddress(const CU& cu, uint64_t val) {
+  absl::string_view table = cu.dwarf().debug_addr;
+  const uint8_t entry_size = cu.unit_sizes().address_size();
+
+  if (entry_size == 4) {
+    SkipBytes((val * 4) + cu.addr_base(), &table);
+    return ReadFixed<uint32_t>(&table);
+  }
+  if (entry_size == 8) {
+    SkipBytes((val * 8) + cu.addr_base(), &table);
+    return ReadFixed<uint64_t>(&table);
+  }
+  BLOATY_UNREACHABLE();
+}
+
+// Parses every attribute of the current DIE in the order |abbrev| lists them,
+// handing each attribute name and parsed value to |func|.
+template <class T>
+void DIEReader::ReadAttributes(const CU& cu, const AbbrevTable::Abbrev* abbrev,
+                               T&& func) {
+  for (auto it = abbrev->attr.begin(); it != abbrev->attr.end(); ++it) {
+    AbbrevTable::Attribute spec = *it;
+    AttrValue parsed = AttrValue::ParseAttr(cu, spec.form, &remaining_);
+    func(spec.name, parsed);
+  }
+}
+
+// Returns a reader positioned at the start of data_, i.e. just past the unit
+// header.
+inline DIEReader CU::GetDIEReader() { return DIEReader(data_); }
+
+}  // namespace dwarf
+}  // namespace bloaty
+
+#endif  // BLOATY_DWARF_DEBUG_INFO_H_

diff --git a/src/dwarf/dwarf_util.cc b/src/dwarf/dwarf_util.cc
new file mode 100644
index 0000000..2eb8f1a
--- /dev/null
+++ b/src/dwarf/dwarf_util.cc

@@ -0,0 +1,75 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "dwarf/dwarf_util.h"
+
+using string_view = absl::string_view;
+
+namespace bloaty {
+namespace dwarf {
+
+// Returns false for address zero and for the all-ones value of the given
+// address size; true otherwise.  uint64/32 max is a tombstone value added by
+// https://reviews.llvm.org/D81784.
+bool IsValidDwarfAddress(uint64_t addr, uint8_t address_size) {
+  const bool is_tombstone32 =
+      address_size == 4 && addr == std::numeric_limits<uint32_t>::max();
+  const bool is_tombstone64 =
+      address_size == 8 && addr == std::numeric_limits<uint64_t>::max();
+  return addr != 0 && !is_tombstone32 && !is_tombstone64;
+}
+
+// Decodes one LEB128 value from the front of |*data| and removes its bytes
+// from |*data|.  When |is_signed| is set the result is sign-extended to 64
+// bits.  Throws if the input ends, or ten bytes go by, without a terminating
+// byte.
+uint64_t ReadLEB128Internal(bool is_signed, string_view* data) {
+  // Ten groups of seven bits are enough to cover 64 bits.
+  const size_t kMaxBytes = 10;
+  const size_t available = data->size() < kMaxBytes ? data->size() : kMaxBytes;
+  uint64_t value = 0;
+
+  for (size_t i = 0; i < available; i++) {
+    const char byte = (*data)[i];
+    const int shift = static_cast<int>(7 * i);
+    value |= static_cast<uint64_t>(byte & 0x7f) << shift;
+    if ((byte & 0x80) != 0) {
+      continue;  // Continuation bit set: more bytes follow.
+    }
+
+    // Final byte.  For signed values, extend the sign bit (0x40 of this byte)
+    // through the bits that were not read.
+    const int bits_read = shift + 7;
+    if (is_signed && bits_read < 64 && (byte & 0x40)) {
+      value |= -(1ULL << bits_read);
+    }
+    data->remove_prefix(i + 1);
+    return value;
+  }
+
+  THROW("corrupt DWARF data, unterminated LEB128");
+}
+
+// Removes one LEB128 value from the front of |*data| without decoding it.
+// Throws if no terminating byte is found within the first ten bytes.
+void SkipLEB128(string_view* data) {
+  const size_t scan_len =
+      std::min(static_cast<size_t>(data->size()), static_cast<size_t>(10));
+
+  size_t pos = 0;
+  while (pos < scan_len) {
+    // The last byte of a LEB128 value has its high bit clear.
+    const bool is_last = ((*data)[pos] & 0x80) == 0;
+    ++pos;
+    if (is_last) {
+      data->remove_prefix(pos);
+      return;
+    }
+  }
+
+  THROW("corrupt DWARF data, unterminated LEB128");
+}
+
+// Returns the null-terminated string that starts |ofs| bytes into |debug_str|.
+absl::string_view ReadDebugStrEntry(absl::string_view debug_str, size_t ofs) {
+  absl::string_view entry = debug_str;
+  SkipBytes(ofs, &entry);
+  return ReadNullTerminated(&entry);
+}
+
+}  // namespace dwarf
+}  // namespace bloaty

diff --git a/src/dwarf/dwarf_util.h b/src/dwarf/dwarf_util.h
new file mode 100644
index 0000000..ecb11b4
--- /dev/null
+++ b/src/dwarf/dwarf_util.h

@@ -0,0 +1,55 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef BLOATY_DWARF_UTIL_H_
+#define BLOATY_DWARF_UTIL_H_
+
+#include <cstdint>
+#include <type_traits>
+
+#include "absl/strings/string_view.h"
+#include "util.h"
+
+namespace bloaty {
+namespace dwarf {
+
+uint64_t ReadLEB128Internal(bool is_signed, absl::string_view* data);
+
+// Reads a DWARF LEB128 varint, where high bits indicate continuation.
+// The value is decoded as signed or unsigned to match T, and an exception is
+// thrown when it does not fit in T.
+template <typename T>
+T ReadLEB128(absl::string_view* data) {
+  constexpr bool kSigned = std::is_signed<T>::value;
+  using Wide = typename std::conditional<kSigned, int64_t, uint64_t>::type;
+
+  Wide wide = ReadLEB128Internal(kSigned, data);
+  const bool too_big = wide > std::numeric_limits<T>::max();
+  const bool too_small = wide < std::numeric_limits<T>::min();
+  if (too_big || too_small) {
+    THROW("DWARF data contained larger LEB128 than we were expecting");
+  }
+  return static_cast<T>(wide);
+}
+
+void SkipLEB128(absl::string_view* data);
+
+bool IsValidDwarfAddress(uint64_t addr, uint8_t address_size);
+
+// Divides |n| by |d|, adding d - 1 to |n| first so that a non-negative |n|
+// with a positive |d| rounds up instead of down.
+inline int DivRoundUp(int n, int d) {
+  const int biased = n + (d - 1);
+  return biased / d;
+}
+
+absl::string_view ReadDebugStrEntry(absl::string_view debug_str, size_t ofs);
+
+}  // namespace dwarf
+}  // namespace bloaty
+
+#endif  // BLOATY_DWARF_UTIL_H_

diff --git a/src/dwarf/line_info.cc b/src/dwarf/line_info.cc
new file mode 100644
index 0000000..c2dfc18
--- /dev/null
+++ b/src/dwarf/line_info.cc

@@ -0,0 +1,288 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "dwarf/line_info.h"
+
+#include "dwarf/dwarf_util.h"
+#include "dwarf_constants.h"
+
+using namespace dwarf2reader;
+using absl::string_view;
+
+namespace bloaty {
+
+extern int verbose_level;
+
+namespace dwarf {
+
+// Returns the name of file |index| prefixed with its include directory and a
+// "/" (no prefix when the directory is empty).  Results are built on first use
+// and cached in expanded_filenames_.  Throws if |index| is out of range.
+const std::string& LineInfoReader::GetExpandedFilename(size_t index) {
+  const size_t file_count = filenames_.size();
+  if (index >= file_count) {
+    THROW("filename index out of range");
+  }
+
+  // The cache is grown lazily to match the file table.
+  if (expanded_filenames_.size() <= index) {
+    expanded_filenames_.resize(file_count);
+  }
+
+  std::string& expanded = expanded_filenames_[index];
+  if (!expanded.empty()) {
+    return expanded;
+  }
+
+  const FileName& entry = filenames_[index];
+  expanded = std::string(include_directories_[entry.directory_index]);
+  if (!expanded.empty()) {
+    expanded += "/";
+  }
+  expanded += std::string(entry.name);
+  return expanded;
+}
+
+// Applies an operation advance of |amount| to the current address and
+// op_index.
+void LineInfoReader::Advance(uint64_t amount) {
+  if (params_.maximum_operations_per_instruction != 1) {
+    DoAdvance(amount, params_.maximum_operations_per_instruction);
+    return;
+  }
+
+  // This is by far the common case (only false on VLIW architectures), and
+  // passing a literal 1 lets inlining/specialization avoid a costly division.
+  DoAdvance(amount, 1);
+}
+
+// Adds |advance| operations to the current position: the address moves by
+// minimum_instruction_length for every |max_per_instr| operations and the
+// remainder becomes the new op_index.
+void LineInfoReader::DoAdvance(uint64_t advance, uint8_t max_per_instr) {
+  const uint64_t total_ops = info_.op_index + advance;
+  info_.address +=
+      params_.minimum_instruction_length * (total_ops / max_per_instr);
+  info_.op_index = total_ops % max_per_instr;
+}
+
+// Advances by the operation advance encoded in special opcode |op|: its
+// adjusted opcode divided by line_range.
+void LineInfoReader::SpecialOpcodeAdvance(uint8_t op) {
+  const uint8_t adjusted = AdjustedOpcode(op);
+  Advance(adjusted / params_.line_range);
+}
+
+// Returns |op| relative to opcode_base, truncated to eight bits.
+uint8_t LineInfoReader::AdjustedOpcode(uint8_t op) {
+  return static_cast<uint8_t>(op - params_.opcode_base);
+}
+
+// Positions the reader at the line number program whose header starts |offset|
+// bytes into .debug_line.  Parses the header (parameters, standard opcode
+// lengths, include directories and file names), replacing whatever an earlier
+// call stored, and resets the line state so that ReadLineInfo() starts at the
+// beginning of the program.  |address_size| must be 4 or 8.
+//
+// NOTE(review): the DWARF version is not validated here, and DWARF 5 line
+// table headers use a different layout from the one parsed below -- confirm
+// that callers only pass tables of version 4 or earlier.
+void LineInfoReader::SeekToOffset(uint64_t offset, uint8_t address_size) {
+  string_view data = file_.debug_line;
+  SkipBytes(offset, &data);
+
+  sizes_.SetAddressSize(address_size);
+  data = sizes_.ReadInitialLength(&data);
+  sizes_.ReadDWARFVersion(&data);
+  uint64_t header_length = sizes_.ReadDWARFOffset(&data);
+  // The program begins header_length bytes after the header_length field.
+  string_view program = data;
+  SkipBytes(header_length, &program);
+
+  params_.minimum_instruction_length = ReadFixed<uint8_t>(&data);
+  // maximum_operations_per_instruction is only read for version 4; for every
+  // other version it is taken to be 1.
+  if (sizes_.dwarf_version() == 4) {
+    params_.maximum_operations_per_instruction = ReadFixed<uint8_t>(&data);
+
+    if (params_.maximum_operations_per_instruction == 0) {
+      THROW("DWARF line info had maximum_operations_per_instruction=0");
+    }
+  } else {
+    params_.maximum_operations_per_instruction = 1;
+  }
+  params_.default_is_stmt = ReadFixed<uint8_t>(&data);
+  params_.line_base = ReadFixed<int8_t>(&data);
+  params_.line_range = ReadFixed<uint8_t>(&data);
+  params_.opcode_base = ReadFixed<uint8_t>(&data);
+  if (params_.line_range == 0) {
+    THROW("line_range of zero will cause divide by zero");
+  }
+
+  // One entry per standard opcode, indexed by opcode; slot 0 is not read from
+  // the input.
+  standard_opcode_lengths_.resize(params_.opcode_base);
+  for (size_t i = 1; i < params_.opcode_base; i++) {
+    standard_opcode_lengths_[i] = ReadFixed<uint8_t>(&data);
+  }
+
+  // Read include_directories.
+  include_directories_.clear();
+
+  // Implicit current directory entry.
+  include_directories_.push_back(string_view());
+
+  // The list ends at an empty string.
+  while (true) {
+    string_view dir = ReadNullTerminated(&data);
+    if (dir.empty()) {
+      break;
+    }
+    include_directories_.push_back(dir);
+  }
+
+  // Read file_names.
+  filenames_.clear();
+  expanded_filenames_.clear();
+
+  // Filename 0 is unused.
+  filenames_.push_back(FileName());
+  // The list ends at an entry with an empty name.
+  while (true) {
+    FileName file_name;
+    file_name.name = ReadNullTerminated(&data);
+    if (file_name.name.empty()) {
+      break;
+    }
+    file_name.directory_index = ReadLEB128<uint32_t>(&data);
+    file_name.modified_time = ReadLEB128<uint64_t>(&data);
+    file_name.file_size = ReadLEB128<uint64_t>(&data);
+    // Checked here so that GetExpandedFilename() can index
+    // include_directories_ without a further check.
+    if (file_name.directory_index >= include_directories_.size()) {
+      THROW("directory index out of range");
+    }
+    filenames_.push_back(file_name);
+  }
+
+  info_ = LineInfo(params_.default_is_stmt);
+  remaining_ = program;
+  shadow_ = false;
+}
+
+// Runs the line number program until it emits the next row, leaving that row
+// in info_.  Returns true when a row was produced and false when the program
+// is exhausted.
+//
+// Rows are emitted by special opcodes, DW_LNS_copy and DW_LNE_end_sequence.
+// While shadow_ is set (the most recent DW_LNE_set_address set the address to
+// zero) rows are computed but not reported.
+bool LineInfoReader::ReadLineInfo() {
+  // Final step of last DW_LNS_copy / special opcode.
+  info_.discriminator = 0;
+  info_.basic_block = false;
+  info_.prologue_end = false;
+  info_.epilogue_begin = false;
+
+  // Final step of DW_LNE_end_sequence.
+  info_.end_sequence = false;
+
+  string_view data = remaining_;
+
+  while (true) {
+    if (data.empty()) {
+      remaining_ = data;
+      return false;
+    }
+
+    uint8_t op = ReadFixed<uint8_t>(&data);
+
+    if (op >= params_.opcode_base) {
+      // Special opcode: advances both the address and the line, then emits a
+      // row.
+      SpecialOpcodeAdvance(op);
+      info_.line +=
+          params_.line_base + (AdjustedOpcode(op) % params_.line_range);
+      if (!shadow_) {
+        remaining_ = data;
+        return true;
+      }
+    } else {
+      switch (op) {
+        case DW_LNS_extended_op: {
+          // |len| is the size of the extended opcode byte plus its operands.
+          uint16_t len = ReadLEB128<uint16_t>(&data);
+          uint8_t extended_op = ReadFixed<uint8_t>(&data);
+          switch (extended_op) {
+            case DW_LNE_end_sequence: {
+              // Preserve address and set end_sequence, but reset everything
+              // else.
+              uint64_t addr = info_.address;
+              info_ = LineInfo(params_.default_is_stmt);
+              info_.address = addr;
+              info_.end_sequence = true;
+              if (!shadow_) {
+                remaining_ = data;
+                return true;
+              }
+              break;
+            }
+            case DW_LNE_set_address:
+              info_.address = sizes_.ReadAddress(&data);
+              info_.op_index = 0;
+              shadow_ = (info_.address == 0);
+              break;
+            case DW_LNE_define_file: {
+              FileName file_name;
+              file_name.name = ReadNullTerminated(&data);
+              file_name.directory_index = ReadLEB128<uint32_t>(&data);
+              file_name.modified_time = ReadLEB128<uint64_t>(&data);
+              file_name.file_size = ReadLEB128<uint64_t>(&data);
+              if (file_name.directory_index >= include_directories_.size()) {
+                THROW("directory index out of range");
+              }
+              filenames_.push_back(file_name);
+              break;
+            }
+            case DW_LNE_set_discriminator:
+              info_.discriminator = ReadLEB128<uint32_t>(&data);
+              break;
+            default:
+              // We don't understand this opcode, skip it.  |len| includes the
+              // opcode byte that has already been consumed, so only len - 1
+              // bytes of operands remain.
+              if (len > 0) {
+                SkipBytes(static_cast<uint16_t>(len - 1), &data);
+              }
+              if (verbose_level > 0) {
+                fprintf(stderr,
+                        "bloaty: warning: unknown DWARF line table extended "
+                        "opcode: %d\n",
+                        extended_op);
+              }
+              break;
+          }
+          break;
+        }
+        case DW_LNS_copy:
+          if (!shadow_) {
+            remaining_ = data;
+            return true;
+          }
+          break;
+        case DW_LNS_advance_pc:
+          Advance(ReadLEB128<uint64_t>(&data));
+          break;
+        case DW_LNS_advance_line:
+          info_.line += ReadLEB128<int32_t>(&data);
+          break;
+        case DW_LNS_set_file:
+          info_.file = ReadLEB128<uint32_t>(&data);
+          if (info_.file >= filenames_.size()) {
+            THROW("filename index too big");
+          }
+          break;
+        case DW_LNS_set_column:
+          info_.column = ReadLEB128<uint32_t>(&data);
+          break;
+        case DW_LNS_negate_stmt:
+          info_.is_stmt = !info_.is_stmt;
+          break;
+        case DW_LNS_set_basic_block:
+          info_.basic_block = true;
+          break;
+        case DW_LNS_const_add_pc:
+          // Advances the address by the amount special opcode 255 would.
+          SpecialOpcodeAdvance(255);
+          break;
+        case DW_LNS_fixed_advance_pc:
+          info_.address += ReadFixed<uint16_t>(&data);
+          info_.op_index = 0;
+          break;
+        case DW_LNS_set_prologue_end:
+          info_.prologue_end = true;
+          break;
+        case DW_LNS_set_epilogue_begin:
+          info_.epilogue_begin = true;
+          break;
+        case DW_LNS_set_isa:
+          info_.isa = ReadLEB128<uint8_t>(&data);
+          break;
+        default: {
+          // Unknown standard opcode.  The header's standard_opcode_lengths
+          // table gives the number of LEB128 operands it takes (not a byte
+          // count), so skip that many LEB128 values.
+          const size_t operand_count = standard_opcode_lengths_[op];
+          for (size_t i = 0; i < operand_count; i++) {
+            SkipLEB128(&data);
+          }
+          if (verbose_level > 0) {
+            fprintf(stderr,
+                    "bloaty: warning: unknown DWARF line table opcode: %d\n",
+                    op);
+          }
+          break;
+        }
+      }
+    }
+  }
+}
+
+}  // namespace dwarf
+}  // namespace bloaty

diff --git a/src/dwarf/line_info.h b/src/dwarf/line_info.h
new file mode 100644
index 0000000..789e665
--- /dev/null
+++ b/src/dwarf/line_info.h

@@ -0,0 +1,118 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef BLOATY_DWARF_LINE_INFO_H_
+#define BLOATY_DWARF_LINE_INFO_H_
+
+#include <cstdint>
+
+#include "absl/strings/string_view.h"
+#include "dwarf/debug_info.h"
+
+// Code to read the line-number programs (the .debug_line section) in a DWARF
+// file.  Currently we use this for the "inlines" data source, but I think we
+// should probably use the inlining info in debug_info instead.
+//
+// Usage overview:
+//   dwarf::LineInfoReader reader(file);
+//
+//   reader.SeekToOffset(ofs, cu.unit_sizes().address_size());
+//   while (reader.ReadLineInfo()) {
+//     const dwarf::LineInfoReader::LineInfo& info = reader.lineinfo();
+//     // ...
+//   }
+
+namespace bloaty {
+namespace dwarf {
+
+// Reader for DWARF line-number programs.
+//
+// Position the reader with SeekToOffset(), then call ReadLineInfo()
+// repeatedly; each time it returns true, lineinfo() exposes the current row.
+class LineInfoReader {
+ public:
+  // Binds the reader to `file`.  Only a reference is kept, so `file` must
+  // outlive the reader.
+  LineInfoReader(const File& file) : file_(file), info_(0) {}
+
+  // One row of line information.  The field names mirror the registers of
+  // the DWARF line-number state machine.
+  struct LineInfo {
+    LineInfo(bool default_is_stmt) : is_stmt(default_is_stmt) {}
+    uint64_t address = 0;
+    uint32_t file = 1;
+    uint32_t line = 1;
+    uint32_t column = 0;
+    uint32_t discriminator = 0;
+    bool end_sequence = false;
+    bool basic_block = false;
+    bool prologue_end = false;
+    bool epilogue_begin = false;
+    bool is_stmt;
+    uint8_t op_index = 0;
+    uint8_t isa = 0;
+  };
+
+  // One entry of the file-name table.  `name` is a view, not an owned string;
+  // NOTE(review): presumably it points into the section data -- confirm.
+  struct FileName {
+    absl::string_view name;
+    uint32_t directory_index;
+    uint64_t modified_time;
+    uint64_t file_size;
+  };
+
+  // Positions the reader at `offset`; `address_size` is the address size of
+  // the owning compilation unit (see the usage overview).
+  void SeekToOffset(uint64_t offset, uint8_t address_size);
+
+  // Advances to the next row.  Returns true if lineinfo() now holds a new row.
+  bool ReadLineInfo();
+
+  // The most recently produced row.
+  const LineInfo& lineinfo() const { return info_; }
+
+  // Unchecked accessors: `i` must be a valid index into the respective table.
+  const FileName& filename(size_t i) const { return filenames_[i]; }
+  absl::string_view include_directory(size_t i) const {
+    return include_directories_[i];
+  }
+
+  // Returns the expanded name for file-table entry `index`.
+  // NOTE(review): the returned reference presumably refers to an entry cached
+  // in expanded_filenames_ -- confirm its lifetime against the definition.
+  const std::string& GetExpandedFilename(size_t index);
+
+ private:
+  // Header parameters of the current line-number program.  Value-initialized
+  // so that no field is ever read while indeterminate.
+  struct Params {
+    uint8_t minimum_instruction_length;
+    uint8_t maximum_operations_per_instruction;
+    uint8_t default_is_stmt;
+    int8_t line_base;
+    uint8_t line_range;
+    uint8_t opcode_base;
+  } params_ = {};
+
+  const File& file_;
+
+  CompilationUnitSizes sizes_;
+  std::vector<absl::string_view> include_directories_;
+  std::vector<FileName> filenames_;
+  std::vector<uint8_t> standard_opcode_lengths_;
+  std::vector<std::string> expanded_filenames_;
+
+  // Bytes of the current program that have not been consumed yet.
+  absl::string_view remaining_;
+
+  // Whether we are in a "shadow" part of the bytecode program.  Sometimes
+  // parts of the line info program make it into the final binary even though
+  // the corresponding code was stripped.  We can tell when this happened by
+  // looking for DW_LNE_set_address ops where the operand is 0.  This
+  // indicates that a relocation for that argument never got applied, which
+  // probably means that the code got stripped.
+  //
+  // While this is true, we don't yield any LineInfo entries, because the
+  // "address" value is garbage.
+  //
+  // Starts out false so the flag is well-defined from construction onward.
+  bool shadow_ = false;
+
+  LineInfo info_;
+
+  // Helpers that move the address/op_index registers forward; defined in the
+  // .cc file.
+  void DoAdvance(uint64_t advance, uint8_t max_per_instr);
+  void Advance(uint64_t amount);
+  uint8_t AdjustedOpcode(uint8_t op);
+  void SpecialOpcodeAdvance(uint8_t op);
+};
+
+}  // namespace dwarf
+}  // namespace bloaty
+
+#endif  // BLOATY_DWARF_LINE_INFO_H_

diff --git a/src/eh_frame.cc b/src/eh_frame.cc
new file mode 100644
index 0000000..1a6aedf
--- /dev/null
+++ b/src/eh_frame.cc

@@ -0,0 +1,264 @@
+// Copyright 2016 Google Inc. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "bloaty.h"
+#include "util.h"
+#include "absl/strings/string_view.h"
+#include "dwarf_constants.h"
+#include "dwarf/dwarf_util.h"
+
+using absl::string_view;
+using namespace dwarf2reader;
+
+namespace bloaty {
+
+// Decodes one value stored with a DW_EH_PE_* pointer encoding, as used by
+// .eh_frame and .eh_frame_hdr.
+//
+//   encoding:  the encoding byte.  DW_EH_PE_FORMAT_MASK selects how the raw
+//              value is stored, DW_EH_PE_APPLICATION_MASK selects what it is
+//              relative to, and DW_EH_PE_indirect requests an extra load.
+//   is_64bit:  selects 8-byte vs. 4-byte reads for DW_EH_PE_absptr and for
+//              indirect loads.
+//   data:      input; advanced past the bytes that were consumed.
+//   data_base: file pointer that DW_EH_PE_datarel values are relative to.
+//              May be nullptr, in which case datarel encodings throw.
+//   sink:      translates between file pointers and VM addresses.
+//
+// Returns the decoded value, or 0 (consuming nothing) for DW_EH_PE_omit.
+// Throws on unknown formats and on unimplemented application modes.
+uint64_t ReadEncodedPointer(uint8_t encoding, bool is_64bit, string_view* data,
+                            const char* data_base, RangeSink* sink) {
+  // DW_EH_PE_omit is a whole-byte sentinel meaning "no value present", so it
+  // must be recognized before the byte is split into format/application
+  // parts: once masked, the format can only equal DW_EH_PE_omit if the full
+  // byte did, and with a mask narrower than the byte it never would.
+  if (encoding == DW_EH_PE_omit) {
+    return 0;
+  }
+
+  uint64_t value;
+  // Remember where the value starts; pcrel encodings are relative to it.
+  const char* ptr = data->data();
+  uint8_t format = encoding & DW_EH_PE_FORMAT_MASK;
+
+  switch (format) {
+    case DW_EH_PE_absptr:
+      if (is_64bit) {
+        value = ReadFixed<uint64_t>(data);
+      } else {
+        value = ReadFixed<uint32_t>(data);
+      }
+      break;
+    case DW_EH_PE_uleb128:
+      value = dwarf::ReadLEB128<uint64_t>(data);
+      break;
+    case DW_EH_PE_udata2:
+      value = ReadFixed<uint16_t>(data);
+      break;
+    case DW_EH_PE_udata4:
+      value = ReadFixed<uint32_t>(data);
+      break;
+    case DW_EH_PE_udata8:
+      value = ReadFixed<uint64_t>(data);
+      break;
+    case DW_EH_PE_sleb128:
+      value = dwarf::ReadLEB128<int64_t>(data);
+      break;
+    // The signed fixed-width reads are sign-extended by the conversion to
+    // uint64_t, so negative offsets still add correctly below.
+    case DW_EH_PE_sdata2:
+      value = ReadFixed<int16_t>(data);
+      break;
+    case DW_EH_PE_sdata4:
+      value = ReadFixed<int32_t>(data);
+      break;
+    case DW_EH_PE_sdata8:
+      value = ReadFixed<int64_t>(data);
+      break;
+    default:
+      THROWF("Unexpected eh_frame format value: $0", format);
+  }
+
+  uint8_t application = encoding & DW_EH_PE_APPLICATION_MASK;
+
+  switch (application) {
+    case 0:
+      // Absolute value; nothing to add.
+      break;
+    case DW_EH_PE_pcrel:
+      // Relative to the VM address of the encoded value itself.
+      value += sink->TranslateFileToVM(ptr);
+      break;
+    case DW_EH_PE_datarel:
+      if (data_base == nullptr) {
+        THROW("datarel requested but no data_base provided");
+      }
+      value += sink->TranslateFileToVM(data_base);
+      break;
+    case DW_EH_PE_textrel:
+    case DW_EH_PE_funcrel:
+    case DW_EH_PE_aligned:
+      THROWF("Unimplemented eh_frame application value: $0", application);
+  }
+
+  if (encoding & DW_EH_PE_indirect) {
+    // The value computed so far is the VM address where the real value lives.
+    string_view location = sink->TranslateVMToFile(value);
+    if (is_64bit) {
+      value = ReadFixed<uint64_t>(&location);
+    } else {
+      value = ReadFixed<uint32_t>(&location);
+    }
+  }
+
+  return value;
+}
+
+// Code to read the .eh_frame section.  This is not technically DWARF, but it
+// is similar to .debug_frame (which is DWARF) so it's convenient to put it
+// here.
+//
+// The best documentation I can find for this format comes from:
+//
+// *
+// http://refspecs.linuxfoundation.org/LSB_5.0.0/LSB-Core-generic/LSB-Core-generic/ehframechpt.html
+// * https://www.airs.com/blog/archives/460
+//
+// However these are both under-specified.  Some details are not mentioned in
+// either of these (for example, the fact that the function length uses the FDE
+// encoding, but always absolute).  libdwarf's implementation contains a comment
+// saying "It is not clear if this is entirely correct".  Basically the only
+// thing you can trust for some of these details is the code that actually
+// implements unwinding in production:
+//
+// * libunwind http://www.nongnu.org/libunwind/
+//   https://github.com/pathscale/libunwind/blob/master/src/dwarf/Gfde.c
+// * LLVM libunwind (a different project!!)
+//   https://github.com/llvm-mirror/libunwind/blob/master/src/DwarfParser.hpp
+// * libgcc
+//   https://github.com/gcc-mirror/gcc/blob/master/libgcc/unwind-dw2-fde.c
+//
+// Walks every entry in `data`.  CIEs are parsed and remembered (keyed by their
+// position in the file) but not attributed; each FDE is reported to `sink` as
+// a "dwarf_fde" file range associated with the FDE's starting VM address.
+// Throws on malformed input.
+void ReadEhFrame(string_view data, RangeSink* sink) {
+  string_view remaining = data;
+
+  struct CIEInfo {
+    int version = 0;
+    uint32_t code_align = 0;
+    int32_t data_align = 0;
+    uint8_t fde_encoding = 0;
+    uint8_t lsda_encoding = 0;
+    bool is_signal_handler = false;
+    bool has_augmentation_length = false;
+    uint64_t personality_function = 0;
+    uint32_t return_address_reg = 0;
+  };
+
+  // Keyed by the file pointer at which each CIE (including its length field)
+  // starts, which is what an FDE's CIE pointer resolves to.
+  std::unordered_map<const void*, CIEInfo> cie_map;
+
+  while (remaining.size() > 0) {
+    dwarf::CompilationUnitSizes sizes;
+    string_view full_entry = remaining;
+    string_view entry = sizes.ReadInitialLength(&remaining);
+    if (entry.size() == 0 && remaining.size() == 0) {
+      // Empty final entry: end of the section.
+      return;
+    }
+    // full_entry = length field + payload, i.e. the whole on-disk record.
+    full_entry =
+        full_entry.substr(0, entry.size() + (entry.data() - full_entry.data()));
+    // For an FDE the id field doubles as the CIE pointer, which is measured
+    // from the field's own position, so remember that before consuming it.
+    const char* id_field = entry.data();
+    uint32_t id = ReadFixed<uint32_t>(&entry);
+    if (id == 0) {
+      // CIE, we don't attribute this yet.
+      CIEInfo& cie_info = cie_map[full_entry.data()];
+      cie_info.version = ReadFixed<uint8_t>(&entry);
+      string_view aug_string = ReadNullTerminated(&entry);
+      cie_info.code_align = dwarf::ReadLEB128<uint32_t>(&entry);
+      cie_info.data_align = dwarf::ReadLEB128<int32_t>(&entry);
+      // The return address register is a single byte in version 1 and a
+      // ULEB128 in version 3.
+      switch (cie_info.version) {
+        case 1:
+          cie_info.return_address_reg = ReadFixed<uint8_t>(&entry);
+          break;
+        case 3:
+          cie_info.return_address_reg = dwarf::ReadLEB128<uint32_t>(&entry);
+          break;
+        default:
+          THROW("Unexpected eh_frame CIE version");
+      }
+      // Each augmentation character announces one piece of augmentation data,
+      // stored in the same order as the characters.
+      while (aug_string.size() > 0) {
+        switch (aug_string[0]) {
+          case 'z':
+            // Length until the end of augmentation data.
+            cie_info.has_augmentation_length = true;
+            dwarf::ReadLEB128<uint32_t>(&entry);
+            break;
+          case 'L':
+            cie_info.lsda_encoding = ReadFixed<uint8_t>(&entry);
+            break;
+          case 'R':
+            cie_info.fde_encoding = ReadFixed<uint8_t>(&entry);
+            break;
+          case 'S':
+            cie_info.is_signal_handler = true;
+            break;
+          case 'P': {
+            uint8_t encoding = ReadFixed<uint8_t>(&entry);
+            cie_info.personality_function =
+                ReadEncodedPointer(encoding, true, &entry, nullptr, sink);
+            break;
+          }
+          default:
+            THROW("Unexpected augmentation character");
+        }
+        aug_string.remove_prefix(1);
+      }
+    } else {
+      // FDE: `id` is the distance from the id field back to the start of the
+      // owning CIE.  The value comes from the file, so reject distances that
+      // would land before the section rather than forming an out-of-range
+      // pointer (which is undefined behavior even if never dereferenced).
+      if (id > static_cast<uint64_t>(id_field - data.data())) {
+        THROW("Couldn't find CIE for FDE");
+      }
+      auto iter = cie_map.find(id_field - id);
+      if (iter == cie_map.end()) {
+        THROW("Couldn't find CIE for FDE");
+      }
+      const CIEInfo& cie_info = iter->second;
+      // TODO(haberman): don't hard-code 64-bit.
+      uint64_t address = ReadEncodedPointer(cie_info.fde_encoding, true, &entry,
+                                            nullptr, sink);
+      // TODO(haberman): Technically the FDE addresses could span a
+      // function/compilation unit?  They can certainly span inlines.
+      /*
+      uint64_t length =
+        ReadEncodedPointer(cie_info.fde_encoding & 0xf, true, &entry, sink);
+      (void)length;
+
+      if (cie_info.has_augmentation_length) {
+        uint32_t augmentation_length = dwarf::ReadLEB128<uint32_t>(&entry);
+        (void)augmentation_length;
+      }
+
+      uint64_t lsda =
+          ReadEncodedPointer(cie_info.lsda_encoding, true, &entry, sink);
+      if (lsda) {
+      }
+      */
+
+      sink->AddFileRangeForVMAddr("dwarf_fde", address, full_entry);
+    }
+  }
+}
+
+// Parses the .eh_frame_hdr section and reports each row of its lookup table
+// to `sink` as a "dwarf_fde_table" file range, associated with the row's
+// initial-location VM address.  Throws if the header version is not 1.
+//
+// See documentation here:
+//   http://refspecs.linuxfoundation.org/LSB_5.0.0/LSB-Core-generic/LSB-Core-generic/ehframechpt.html#EHFRAME
+void ReadEhFrameHdr(string_view data, RangeSink* sink) {
+  // datarel-encoded values are resolved against the start of the section.
+  const char* const section_start = data.data();
+
+  // Fixed four-byte preamble: version followed by three encoding bytes.
+  const uint8_t version = ReadFixed<uint8_t>(&data);
+  const uint8_t frame_ptr_encoding = ReadFixed<uint8_t>(&data);
+  const uint8_t count_encoding = ReadFixed<uint8_t>(&data);
+  const uint8_t table_encoding = ReadFixed<uint8_t>(&data);
+
+  if (version != 1) {
+    THROWF("Unknown eh_frame_hdr version: $0", version);
+  }
+
+  // TODO(haberman): don't hard-code 64-bit.
+  // The pointer to .eh_frame is not needed, but it must still be consumed.
+  (void)ReadEncodedPointer(frame_ptr_encoding, true, &data, section_start,
+                           sink);
+  const uint64_t num_rows =
+      ReadEncodedPointer(count_encoding, true, &data, section_start, sink);
+
+  for (uint64_t rows_left = num_rows; rows_left > 0; --rows_left) {
+    const char* const row_start = data.data();
+    const uint64_t initial_location =
+        ReadEncodedPointer(table_encoding, true, &data, section_start, sink);
+
+    // We could add the FDE address with an unknown length if we wanted to skip
+    // reading eh_frame.  We can't count on this table being available though,
+    // so we don't want to remove the eh_frame reading code altogether.
+    (void)ReadEncodedPointer(table_encoding, true, &data, section_start, sink);
+
+    // The row is exactly the bytes the two reads above consumed.
+    const string_view row(row_start, data.data() - row_start);
+    sink->AddFileRangeForVMAddr("dwarf_fde_table", initial_location, row);
+  }
+}
+
+}  // namespace bloaty

diff --git a/src/elf.cc b/src/elf.cc
index 355210b..79d9cc7 100644
--- a/src/elf.cc
+++ b/src/elf.cc

@@ -744,12 +744,12 @@
 //
 // - 24 bits for index (up to 16M symbols with -ffunction-sections)
 // - 40 bits for address (up to 1TB section)
-static uint64_t ToVMAddr(size_t addr, uint64_t ndx, bool is_object) {
+static uint64_t ToVMAddr(uint64_t addr, uint64_t ndx, bool is_object) {
   if (is_object) {
     if (ndx >= 1 << 24) {
       THROW("ndx overflow: too many sections");
     }
-    if (addr >= 1ULL << 40) {
+    if (addr >= ((uint64_t)1) << 40) {
       THROW("address overflow: section too big");
     }
     return (ndx << 40) | addr;
@@ -1332,7 +1332,7 @@
                          false);
           dwarf::File dwarf;
           ReadDWARFSections(debug_file().file_data(), &dwarf, sink);
-          ReadDWARFCompileUnits(dwarf, symtab, symbol_map, sink);
+          ReadDWARFCompileUnits(dwarf, symbol_map, sink);
           break;
         }
         case DataSource::kInlines: {

diff --git a/src/macho.cc b/src/macho.cc
index 2c25c5b..f399853 100644
--- a/src/macho.cc
+++ b/src/macho.cc

@@ -584,7 +584,7 @@
           ParseSymbols(debug_file().file_data().data(), &symtab, &symbol_sink);
           dwarf::File dwarf;
           ReadDebugSectionsFromMachO(debug_file().file_data(), &dwarf, sink);
-          ReadDWARFCompileUnits(dwarf, symtab, symbol_map, sink);
+          ReadDWARFCompileUnits(dwarf, symbol_map, sink);
           ParseSymbols(sink->input_file().data(), nullptr, sink);
           break;
         }

diff --git a/src/pe.cc b/src/pe.cc
index 4a0364b..6326450 100644
--- a/src/pe.cc
+++ b/src/pe.cc

@@ -69,6 +69,7 @@
 
   bool IsOpen() const { return ok_; }
 
+  string_view entire_file() const { return data_; }
   string_view header_region() const { return header_region_; }
 
   uint32_t section_count() const { return section_count_; }
@@ -87,7 +88,7 @@
 
   bool ok_;
   bool is_64bit_;
-  string_view data_;
+  const string_view data_;
 
   pe_dos_header dos_header_;
   pe_header pe_header_;
@@ -182,15 +183,13 @@
 
 void ParseSections(const PeFile& pe, RangeSink* sink) {
   assert(pe.IsOpen());
-  ForEachSection(pe, [sink](const Section& section) {
+  ForEachSection(pe, [sink, &pe](const Section& section) {
     uint64_t vmaddr = section.virtual_addr();
     uint64_t vmsize = section.virtual_size();
+    absl::string_view section_data = StrictSubstr(
+        pe.entire_file(), section.raw_offset(), section.raw_size());
 
-    uint64_t fileoff = section.raw_offset();
-    uint64_t filesize = section.raw_size();
-
-    sink->AddRange("pe_sections", section.name, vmaddr, vmsize, fileoff,
-                   filesize);
+    sink->AddRange("pe_sections", section.name, vmaddr, vmsize, section_data);
   });
 }
 

diff --git a/src/util.h b/src/util.h
index b934027..4db4b8b 100644
--- a/src/util.h
+++ b/src/util.h

@@ -19,6 +19,7 @@
 
 #include "absl/numeric/int128.h"
 #include "absl/strings/string_view.h"
+#include "absl/strings/substitute.h"
 
 namespace bloaty {
 

diff --git a/src/webassembly.cc b/src/webassembly.cc
index c2c6e9a..9d1ccc0 100644
--- a/src/webassembly.cc
+++ b/src/webassembly.cc

@@ -101,7 +101,7 @@
     uint32_t size = ReadVarUInt32(&data);
     ret.contents = ReadPiece(size, &data);
     size_t header_size = ret.contents.data() - section_data.data();
-    ret.data = section_data.substr(0, size + header_size);
+    ret.data = ReadPiece(size + header_size, &section_data);
 
     if (ret.id == 0) {
       uint32_t name_len = ReadVarUInt32(&ret.contents);
@@ -193,8 +193,7 @@
   while (!data.empty()) {
     char type = ReadVarUInt7(&data);
     uint32_t size = ReadVarUInt32(&data);
-    string_view section = data.substr(0, size);
-    data = data.substr(size);
+    string_view section = ReadPiece(size, &data);
 
     if (static_cast<NameType>(type) == NameType::kFunction) {
       uint32_t count = ReadVarUInt32(&section);
@@ -203,7 +202,7 @@
         uint32_t index = ReadVarUInt32(&section);
         uint32_t name_len = ReadVarUInt32(&section);
         string_view name = ReadPiece(name_len, &section);
-        entry = entry.substr(0, name.data() - entry.data() + name.size());
+        entry = StrictSubstr(entry, 0, name.data() - entry.data() + name.size());
         sink->AddFileRange("wasm_funcname", name, entry);
         (*names)[index] = std::string(name);
       }
@@ -288,8 +287,8 @@
     uint32_t size = ReadVarUInt32(&data);
     uint32_t total_size = size + (data.data() - func.data());
 
-    func = func.substr(0, total_size);
-    data = data.substr(size);
+    func = StrictSubstr(func, 0, total_size);
+    data = StrictSubstr(data, size);
 
     auto iter = names.find(num_imports + i);
 
@@ -332,7 +331,7 @@
     sink->AddFileRange("wasm_overhead", name2, section.data);
   });
   sink->AddFileRange("wasm_overhead", "[WASM Header]",
-                     sink->input_file().data().substr(0, 8));
+                     StrictSubstr(sink->input_file().data(), 0, 8));
 }
 
 class WebAssemblyObjectFile : public ObjectFile {

diff --git a/tests/dwarf/debug_info/ignore-declarations.test b/tests/dwarf/debug_info/ignore-declarations.test
index 16ac641..e88fbf5 100644
--- a/tests/dwarf/debug_info/ignore-declarations.test
+++ b/tests/dwarf/debug_info/ignore-declarations.test

@@ -1,6 +1,13 @@
 # Test that we properly ignore DIEs that have DW_AT_declaration=true.
 # This indicates a function that was declared, but not defined.
 # We don't want to register declarations, only definitions.
+#
+# This test is somewhat unrealistic, as it contains DIEs we would
+# probably never see in the real world (specifically, DIEs that have
+# both DW_AT_declaration and DW_AT_low_pc). However this may be the
+# only way of testing that we are truly skipping declarations, since
+# the skipping of declarations may not have any actual observable
+# effect on real-world data.
 
 # RUN: %yaml2obj %s --docnum=1 -o %t.obj
 # RUN: %yaml2obj %s --docnum=2 -o %t.dwo
@@ -49,31 +56,10 @@
       - Name:            GNU
         Desc:            6CF422D909772A0FB5400518A689D9F15F14BF57
         Type:            0x3  # NT_GNU_BUILD_ID
-  - Name:            .text
-    Type:            SHT_PROGBITS
-    Flags:           [ SHF_ALLOC, SHF_EXECINSTR ]
-    Address:         0x1000
-    AddressAlign:    0x10
-    Size:            0x20
-Symbols:
-  - Name:            foo_func
-    Type:            STT_FUNC
-    Section:         .text
-    Binding:         STB_GLOBAL
-    Value:           0x1000
-    Size:            0x10
-  - Name:            bar_func
-    Type:            STT_FUNC
-    Section:         .text
-    Binding:         STB_GLOBAL
-    Value:           0x1010
-    Size:            0x10
 DWARF:
   debug_str:
     - foo.c
     - bar.c
-    - foo_func
-    - bar_func
   debug_abbrev:
     - ID:              0
       Table:
@@ -87,26 +73,33 @@
           Tag:             DW_TAG_subprogram
           Children:        DW_CHILDREN_no
           Attributes:
-            - Attribute:       DW_AT_linkage_name
-              Form:            DW_FORM_strp
+            - Attribute:       DW_AT_low_pc
+              Form:            DW_FORM_addr
+            - Attribute:       DW_AT_high_pc
+              Form:            DW_FORM_data4
             - Attribute:       DW_AT_declaration
               Form:            DW_FORM_flag_present
         - Code:            0x3
           Tag:             DW_TAG_subprogram
           Children:        DW_CHILDREN_no
           Attributes:
-            - Attribute:       DW_AT_linkage_name
-              Form:            DW_FORM_strp
+            - Attribute:       DW_AT_low_pc
+              Form:            DW_FORM_addr
+            - Attribute:       DW_AT_high_pc
+              Form:            DW_FORM_data4
   debug_info:
     # 0x0000000b: DW_TAG_compile_unit
-    #               DW_AT_name        ("foo.c")
+    #               DW_AT_name	("foo.c")
     #
     # 0x00000010:   DW_TAG_subprogram
-    #                 DW_AT_linkage_name      ("bar_func")
-    #                 DW_AT_declaration       (true)
+    #                 DW_AT_low_pc	(0x0000000000001000)
+    #                 DW_AT_high_pc	(0x0000000000001010)
+    #                 # This entry should be ignored because declaration=true.
+    #                 DW_AT_declaration	(true)
     #
-    # 0x00000015:   DW_TAG_subprogram
-    #                 DW_AT_linkage_name      ("foo_func")
+    # 0x0000001d:   DW_TAG_subprogram
+    #                 DW_AT_low_pc	(0x0000000000001010)
+    #                 DW_AT_high_pc	(0x0000000000001020)
     - Version:         4
       AbbrevTableID:   0
       AbbrOffset:      0x0
@@ -117,16 +110,19 @@
             - Value:           0x0
         - AbbrCode:        0x2
           Values:
-            - Value:           0x15
+            - Value:           0x1000
+            - Value:           0x10
         - AbbrCode:        0x3
           Values:
-            - Value:           0xc
+            - Value:           0x1010
+            - Value:           0x10
         - AbbrCode:        0x0
-    # 0x00000026: DW_TAG_compile_unit
-    #               DW_AT_name        ("bar.c")
-    #
-    # 0x0000002b:   DW_TAG_subprogram
-    #                 DW_AT_linkage_name      ("bar_func")
+    # 0x00000036: DW_TAG_compile_unit
+    #               DW_AT_name	("bar.c")
+    # 
+    # 0x0000003b:   DW_TAG_subprogram
+    #                 DW_AT_low_pc	(0x0000000000001000)
+    #                 DW_AT_high_pc	(0x0000000000001010)
     - Version:         4
       AbbrevTableID:   0
       AbbrOffset:      0x0
@@ -137,11 +133,12 @@
             - Value:           0x6
         - AbbrCode:        0x3
           Values:
-            - Value:           0x15
+            - Value:           0x1000
+            - Value:           0x10
         - AbbrCode:        0x0
 ...
 
 # CHECK: VM MAP:
 # CHECK: 0000-1000              4096             [-- Nothing mapped --]
-# CHECK: 1000-1010                16             foo.c
-# CHECK: 1010-1020                16             bar.c
+# CHECK: 1000-1010                16             bar.c
+# CHECK: 1010-1020                16             foo.c

diff --git a/tests/testdata/fuzz_corpus/clusterfuzz-testcase-minimized-fuzz_target-5640071541161984 b/tests/testdata/fuzz_corpus/clusterfuzz-testcase-minimized-fuzz_target-5640071541161984
new file mode 100644
index 0000000..bd612e9
--- /dev/null
+++ b/tests/testdata/fuzz_corpus/clusterfuzz-testcase-minimized-fuzz_target-5640071541161984
Binary files differ

diff --git a/tests/testdata/fuzz_corpus/clusterfuzz-testcase-minimized-fuzz_target-6500838179733504 b/tests/testdata/fuzz_corpus/clusterfuzz-testcase-minimized-fuzz_target-6500838179733504
new file mode 100644
index 0000000..72cbeb9
--- /dev/null
+++ b/tests/testdata/fuzz_corpus/clusterfuzz-testcase-minimized-fuzz_target-6500838179733504
Binary files differ

diff --git a/tests/testdata/fuzz_corpus/testcase-4665949898276864 b/tests/testdata/fuzz_corpus/testcase-4665949898276864
new file mode 100644
index 0000000..4a82bb0
--- /dev/null
+++ b/tests/testdata/fuzz_corpus/testcase-4665949898276864
Binary files differ

diff --git a/tests/testdata/fuzz_corpus/testcase-5207237867470848 b/tests/testdata/fuzz_corpus/testcase-5207237867470848
new file mode 100644
index 0000000..5dcf301
--- /dev/null
+++ b/tests/testdata/fuzz_corpus/testcase-5207237867470848
Binary files differ

diff --git a/tests/testdata/fuzz_corpus/testcase-5896363763695616 b/tests/testdata/fuzz_corpus/testcase-5896363763695616
new file mode 100644
index 0000000..8012570
--- /dev/null
+++ b/tests/testdata/fuzz_corpus/testcase-5896363763695616
Binary files differ
commit	58b103866b45cc534a860c136ac82ae8caa16f46	[log] [tgz]
author	Joshua Haberman <jhaberman@gmail.com>	Sun Aug 08 16:25:54 2021 -0700
committer	Joshua Haberman <jhaberman@gmail.com>	Sun Aug 08 16:25:54 2021 -0700
tree	01250b008546e2912260faf6fba30ef228881864
parent	c952309265f1a888338ef1ea3fd3ec6d1f279b73 [diff]
parent	90bac14f8ffc25414957ec05dff2dc66dbef937f [diff]